{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "301cd314",
   "metadata": {},
   "source": [
    "### 1.拿到文本doc"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "c29ec30a",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "from tqdm import tqdm"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "87fc9023",
   "metadata": {},
   "source": [
    "#### 专利"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "0cf0b78f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>PN 专利号</th>\n",
       "      <th>类别</th>\n",
       "      <th>标引</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>预处理文本</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>patent0</td>\n",
       "      <td>CN102017938-A</td>\n",
       "      <td>技术</td>\n",
       "      <td>3.0</td>\n",
       "      <td>Greenhouse suspended self-propelled target    ...</td>\n",
       "      <td>greenhouse suspend self-propelled target spray...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>patent1</td>\n",
       "      <td>DE102010033115-A1;  WO2012016974-A1</td>\n",
       "      <td>机械手</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Unloading manipulator for unloading cargo from...</td>\n",
       "      <td>unload manipulator unload cargo container carg...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>patent2</td>\n",
       "      <td>DE10250227-A1</td>\n",
       "      <td>技术</td>\n",
       "      <td>3.0</td>\n",
       "      <td>Expansion device for connection to data-bus e....</td>\n",
       "      <td>expansion device connection data-bus e.g envir...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>patent3</td>\n",
       "      <td>JP2003168326-A</td>\n",
       "      <td>工业机器人</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Cable harness for industrial robot, has pair o...</td>\n",
       "      <td>cable harness industrial robot pair support ca...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>patent4</td>\n",
       "      <td>CN101774174-A</td>\n",
       "      <td>技术</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Parallel mechanism for e.g. space manipulator,...</td>\n",
       "      <td>parallel mechanism e.g space manipulator movea...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "        编号                               PN 专利号     类别   标引  \\\n",
       "0  patent0                        CN102017938-A     技术  3.0   \n",
       "1  patent1  DE102010033115-A1;  WO2012016974-A1    机械手  NaN   \n",
       "2  patent2                        DE10250227-A1     技术  3.0   \n",
       "3  patent3                       JP2003168326-A  工业机器人  NaN   \n",
       "4  patent4                        CN101774174-A     技术  NaN   \n",
       "\n",
       "                                             TI 文献标题  \\\n",
       "0  Greenhouse suspended self-propelled target    ...   \n",
       "1  Unloading manipulator for unloading cargo from...   \n",
       "2  Expansion device for connection to data-bus e....   \n",
       "3  Cable harness for industrial robot, has pair o...   \n",
       "4  Parallel mechanism for e.g. space manipulator,...   \n",
       "\n",
       "                                               预处理文本  \n",
       "0  greenhouse suspend self-propelled target spray...  \n",
       "1  unload manipulator unload cargo container carg...  \n",
       "2  expansion device connection data-bus e.g envir...  \n",
       "3  cable harness industrial robot pair support ca...  \n",
       "4  parallel mechanism e.g space manipulator movea...  "
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 预处理过的标题 摘要\n",
    "df = pd.read_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\专利\\2预处理.xlsx')\n",
    "df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "71369c55",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(88529, 6)"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8ec2fc41",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "e8d14f4a",
   "metadata": {},
   "outputs": [],
   "source": [
    "data = pd.read_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\分类结果\\专利-分类为0-原始标记为2.xlsx')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "062373b8",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(19256, 32)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>PN 专利号</th>\n",
       "      <th>类别</th>\n",
       "      <th>标引</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>编号.1</th>\n",
       "      <th>PN 专利号.1</th>\n",
       "      <th>类别.1</th>\n",
       "      <th>标引.1</th>\n",
       "      <th>TI 文献标题.1</th>\n",
       "      <th>...</th>\n",
       "      <th>PI 优先权申请信息和日期</th>\n",
       "      <th>DS 指定国家（地区）/区域</th>\n",
       "      <th>FS 检索字段</th>\n",
       "      <th>CP 此专利参考的专利信息</th>\n",
       "      <th>CR 此专利引用的非专利信息</th>\n",
       "      <th>DN 化合物</th>\n",
       "      <th>MN Markush 号</th>\n",
       "      <th>RI ResearcherID 号</th>\n",
       "      <th>CI Derwent 化合物号</th>\n",
       "      <th>RG Derwent 注册号</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>patent76290</td>\n",
       "      <td>WO2020041221-A1</td>\n",
       "      <td>应用</td>\n",
       "      <td>0</td>\n",
       "      <td>Method for facilitating product-by-process for...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>WO2020041221-A1</td>\n",
       "      <td>应用</td>\n",
       "      <td>2.0</td>\n",
       "      <td>Method for facilitating product-by-process for...</td>\n",
       "      <td>...</td>\n",
       "      <td>US719738P    20 Aug 2018;  US719741P    20 Aug...</td>\n",
       "      <td>WO2020041221-A1:      (National): AE;  AG;  AL...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>WO2020041221-A1 -- CN107932550-A   UNIV NORTHW...</td>\n",
       "      <td>WO2020041221-A1  CHRIST JOSEF F ET          AL...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>patent66777</td>\n",
       "      <td>CN112784676-A</td>\n",
       "      <td>应用</td>\n",
       "      <td>0</td>\n",
       "      <td>Method for processing image in robot, involves...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>CN112784676-A</td>\n",
       "      <td>应用</td>\n",
       "      <td>2.0</td>\n",
       "      <td>Method for processing image in robot, involves...</td>\n",
       "      <td>...</td>\n",
       "      <td>CN11410238    04 Dec 2020</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>patent55578</td>\n",
       "      <td>CN108759672-A;  CN108759672-B</td>\n",
       "      <td>应用</td>\n",
       "      <td>0</td>\n",
       "      <td>Industrial robot end position measurement and ...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>CN108759672-A;  CN108759672-B</td>\n",
       "      <td>应用</td>\n",
       "      <td>2.0</td>\n",
       "      <td>Industrial robot end position measurement and ...</td>\n",
       "      <td>...</td>\n",
       "      <td>CN10624662    16 Jun 2018</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>CN108759672-A -- CN104406585-A   HANGZHOU INST...</td>\n",
       "      <td>CN108759672-A  : \"\",          ,relevantClaims[...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>patent31925</td>\n",
       "      <td>CN106289378-A;  CN106289378-B</td>\n",
       "      <td>技术</td>\n",
       "      <td>0</td>\n",
       "      <td>Laser tracker based industrial robot performan...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>CN106289378-A;  CN106289378-B</td>\n",
       "      <td>技术</td>\n",
       "      <td>2.0</td>\n",
       "      <td>Laser tracker based industrial robot performan...</td>\n",
       "      <td>...</td>\n",
       "      <td>CN10664737    12 Aug 2016</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>CN106289378-A -- CN102062576-A   UNIV ZHEJIANG...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>patent67950</td>\n",
       "      <td>CN109664291-A</td>\n",
       "      <td>应用</td>\n",
       "      <td>0</td>\n",
       "      <td>Robot guiding method, involves performing imag...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>CN109664291-A</td>\n",
       "      <td>应用</td>\n",
       "      <td>2.0</td>\n",
       "      <td>Robot guiding method, involves performing imag...</td>\n",
       "      <td>...</td>\n",
       "      <td>CN10957526    13 Oct 2017</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5 rows × 32 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "            编号                         PN 专利号  类别  标引  \\\n",
       "0  patent76290                WO2020041221-A1  应用   0   \n",
       "1  patent66777                  CN112784676-A  应用   0   \n",
       "2  patent55578  CN108759672-A;  CN108759672-B  应用   0   \n",
       "3  patent31925  CN106289378-A;  CN106289378-B  技术   0   \n",
       "4  patent67950                  CN109664291-A  应用   0   \n",
       "\n",
       "                                             TI 文献标题  编号.1  \\\n",
       "0  Method for facilitating product-by-process for...   NaN   \n",
       "1  Method for processing image in robot, involves...   NaN   \n",
       "2  Industrial robot end position measurement and ...   NaN   \n",
       "3  Laser tracker based industrial robot performan...   NaN   \n",
       "4  Robot guiding method, involves performing imag...   NaN   \n",
       "\n",
       "                        PN 专利号.1 类别.1  标引.1  \\\n",
       "0                WO2020041221-A1   应用   2.0   \n",
       "1                  CN112784676-A   应用   2.0   \n",
       "2  CN108759672-A;  CN108759672-B   应用   2.0   \n",
       "3  CN106289378-A;  CN106289378-B   技术   2.0   \n",
       "4                  CN109664291-A   应用   2.0   \n",
       "\n",
       "                                           TI 文献标题.1  ...  \\\n",
       "0  Method for facilitating product-by-process for...  ...   \n",
       "1  Method for processing image in robot, involves...  ...   \n",
       "2  Industrial robot end position measurement and ...  ...   \n",
       "3  Laser tracker based industrial robot performan...  ...   \n",
       "4  Robot guiding method, involves performing imag...  ...   \n",
       "\n",
       "                                       PI 优先权申请信息和日期  \\\n",
       "0  US719738P    20 Aug 2018;  US719741P    20 Aug...   \n",
       "1                          CN11410238    04 Dec 2020   \n",
       "2                          CN10624662    16 Jun 2018   \n",
       "3                          CN10664737    12 Aug 2016   \n",
       "4                          CN10957526    13 Oct 2017   \n",
       "\n",
       "                                      DS 指定国家（地区）/区域  FS 检索字段  \\\n",
       "0  WO2020041221-A1:      (National): AE;  AG;  AL...      NaN   \n",
       "1                                                NaN      NaN   \n",
       "2                                                NaN      NaN   \n",
       "3                                                NaN      NaN   \n",
       "4                                                NaN      NaN   \n",
       "\n",
       "                                       CP 此专利参考的专利信息  \\\n",
       "0  WO2020041221-A1 -- CN107932550-A   UNIV NORTHW...   \n",
       "1                                                NaN   \n",
       "2  CN108759672-A -- CN104406585-A   HANGZHOU INST...   \n",
       "3  CN106289378-A -- CN102062576-A   UNIV ZHEJIANG...   \n",
       "4                                                NaN   \n",
       "\n",
       "                                      CR 此专利引用的非专利信息  DN 化合物  MN Markush 号  \\\n",
       "0  WO2020041221-A1  CHRIST JOSEF F ET          AL...     NaN           NaN   \n",
       "1                                                NaN     NaN           NaN   \n",
       "2  CN108759672-A  : \"\",          ,relevantClaims[...     NaN           NaN   \n",
       "3                                                NaN     NaN           NaN   \n",
       "4                                                NaN     NaN           NaN   \n",
       "\n",
       "   RI ResearcherID 号  CI Derwent 化合物号  RG Derwent 注册号  \n",
       "0                NaN              NaN             NaN  \n",
       "1                NaN              NaN             NaN  \n",
       "2                NaN              NaN             NaN  \n",
       "3                NaN              NaN             NaN  \n",
       "4                NaN              NaN             NaN  \n",
       "\n",
       "[5 rows x 32 columns]"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "print(data.shape)\n",
    "data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "c8a72840",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['编号', 'PN 专利号', '类别', '标引', ' TI 文献标题', '编号.1', 'PN 专利号.1', '类别.1',\n",
       "       '标引.1', ' TI 文献标题.1', ' AU 作者', ' AE 专利权人', ' GA 德温特主入藏号', ' AB 摘要',\n",
       "       ' TF  技术焦点摘要', ' EA 提前访问日期', ' DC 德温特分类代码', ' MC 德温特手工代码',\n",
       "       ' IP 国际专利分类号', ' PD 专利详细信息', ' AD 申请详细信息', ' FD 更多申请详细信息',\n",
       "       ' PI 优先权申请信息和日期', ' DS 指定国家（地区）/区域', ' FS 检索字段', ' CP 此专利参考的专利信息',\n",
       "       ' CR 此专利引用的非专利信息', ' DN 化合物', ' MN Markush 号', ' RI ResearcherID 号',\n",
       "       ' CI Derwent 化合物号', ' RG Derwent 注册号'],\n",
       "      dtype='object')"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "data.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "15649316",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array(['patent76290', 'patent66777', 'patent55578', ..., 'patent88463',\n",
       "       'patent88484', 'patent88521'], dtype=object)"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "bianhao = data['编号'].values\n",
    "bianhao"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "e1380b78",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|███████████████████████████████████████████████████████████████████████████| 19256/19256 [02:42<00:00, 118.45it/s]\n"
     ]
    }
   ],
   "source": [
    "idx_ls =[]\n",
    "for i in tqdm(range(len(bianhao))):\n",
    "    ii = bianhao[i]\n",
    "    idx = df[df['编号'] == ii].index\n",
    "    idx_ls.append(idx[0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "2417afc0",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "19256"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(idx_ls)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "0ac472ec",
   "metadata": {},
   "outputs": [],
   "source": [
    "df1 = df.iloc[idx_ls,[5]].reset_index(drop = True)\n",
    "df2 = data[['编号', 'PN 专利号', ' TI 文献标题', ' AD 申请详细信息']].reset_index(drop = True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "695fabc7",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(19256, 5)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>PN 专利号</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>AD 申请详细信息</th>\n",
       "      <th>预处理文本</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>patent76290</td>\n",
       "      <td>WO2020041221-A1</td>\n",
       "      <td>Method for facilitating product-by-process for...</td>\n",
       "      <td>WO2020041221-A1    WOUS047124    20 Aug 2019</td>\n",
       "      <td>method facilitate product-by-process construct...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>patent66777</td>\n",
       "      <td>CN112784676-A</td>\n",
       "      <td>Method for processing image in robot, involves...</td>\n",
       "      <td>CN112784676-A    CN11410238    04 Dec 2020</td>\n",
       "      <td>method process image robot involve analyze hum...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>patent55578</td>\n",
       "      <td>CN108759672-A;  CN108759672-B</td>\n",
       "      <td>Industrial robot end position measurement and ...</td>\n",
       "      <td>CN108759672-A    CN10624662    16 Jun 2018;   ...</td>\n",
       "      <td>industrial robot position measurement displace...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>patent31925</td>\n",
       "      <td>CN106289378-A;  CN106289378-B</td>\n",
       "      <td>Laser tracker based industrial robot performan...</td>\n",
       "      <td>CN106289378-A    CN10664737    12 Aug 2016;   ...</td>\n",
       "      <td>laser tracker base industrial robot performanc...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>patent67950</td>\n",
       "      <td>CN109664291-A</td>\n",
       "      <td>Robot guiding method, involves performing imag...</td>\n",
       "      <td>CN109664291-A    CN10957526    13 Oct 2017</td>\n",
       "      <td>robot guide method involve perform image proce...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "            编号                         PN 专利号  \\\n",
       "0  patent76290                WO2020041221-A1   \n",
       "1  patent66777                  CN112784676-A   \n",
       "2  patent55578  CN108759672-A;  CN108759672-B   \n",
       "3  patent31925  CN106289378-A;  CN106289378-B   \n",
       "4  patent67950                  CN109664291-A   \n",
       "\n",
       "                                             TI 文献标题  \\\n",
       "0  Method for facilitating product-by-process for...   \n",
       "1  Method for processing image in robot, involves...   \n",
       "2  Industrial robot end position measurement and ...   \n",
       "3  Laser tracker based industrial robot performan...   \n",
       "4  Robot guiding method, involves performing imag...   \n",
       "\n",
       "                                           AD 申请详细信息  \\\n",
       "0       WO2020041221-A1    WOUS047124    20 Aug 2019   \n",
       "1         CN112784676-A    CN11410238    04 Dec 2020   \n",
       "2  CN108759672-A    CN10624662    16 Jun 2018;   ...   \n",
       "3  CN106289378-A    CN10664737    12 Aug 2016;   ...   \n",
       "4         CN109664291-A    CN10957526    13 Oct 2017   \n",
       "\n",
       "                                               预处理文本  \n",
       "0  method facilitate product-by-process construct...  \n",
       "1  method process image robot involve analyze hum...  \n",
       "2  industrial robot position measurement displace...  \n",
       "3  laser tracker base industrial robot performanc...  \n",
       "4  robot guide method involve perform image proce...  "
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "new_data = pd.concat([df2,df1],axis=1)\n",
    "print(new_data.shape)\n",
    "new_data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "72359509",
   "metadata": {},
   "outputs": [],
   "source": [
    "new_data.to_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\1语料-专利.xlsx',index = False)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "fd2eda7d",
   "metadata": {},
   "source": [
    "#### 论文"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "aba2d12e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>标引</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>预处理文本</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>2.0</td>\n",
       "      <td>Sensor terminal \"Portable\" for intelligent nav...</td>\n",
       "      <td>sensor terminal portable intelligent navigatio...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>1.0</td>\n",
       "      <td>A Mobile Robot Tracking using Kalman Filter-ba...</td>\n",
       "      <td>mobile robot track kalman filter-based gaussia...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Global and Local Path Planning on Robotic Whee...</td>\n",
       "      <td>global local path planning robotic wheelchair ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>2.0</td>\n",
       "      <td>Whisker sensor design for three dimensional po...</td>\n",
       "      <td>whisker sensor design dimensional position mea...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>2.0</td>\n",
       "      <td>Applying Deep Reinforcement Learning to Cable ...</td>\n",
       "      <td>apply deep reinforcement learn cable drive par...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   编号   标引                                            TI 文献标题  \\\n",
       "0   1  2.0  Sensor terminal \"Portable\" for intelligent nav...   \n",
       "1   2  1.0  A Mobile Robot Tracking using Kalman Filter-ba...   \n",
       "2   3  NaN  Global and Local Path Planning on Robotic Whee...   \n",
       "3   4  2.0  Whisker sensor design for three dimensional po...   \n",
       "4   5  2.0  Applying Deep Reinforcement Learning to Cable ...   \n",
       "\n",
       "                                               预处理文本  \n",
       "0  sensor terminal portable intelligent navigatio...  \n",
       "1  mobile robot track kalman filter-based gaussia...  \n",
       "2  global local path planning robotic wheelchair ...  \n",
       "3  whisker sensor design dimensional position mea...  \n",
       "4  apply deep reinforcement learn cable drive par...  "
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 预处理过的标题摘要\n",
    "df = pd.read_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\论文\\2预处理.xlsx')\n",
    "df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "7940604c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(21758, 4)"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "185066da",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10918, 79)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>标引</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>编号.1</th>\n",
       "      <th>PT 出版物类型</th>\n",
       "      <th>AU 作者</th>\n",
       "      <th>BA 书籍作者</th>\n",
       "      <th>BE 书籍编者</th>\n",
       "      <th>GP 团体作者</th>\n",
       "      <th>AF 作者全名</th>\n",
       "      <th>...</th>\n",
       "      <th>WC Web of Science 主题类别</th>\n",
       "      <th>WE Web of Science 索引</th>\n",
       "      <th>SC 研究方向</th>\n",
       "      <th>GA IDS 编号</th>\n",
       "      <th>PM PubMedID</th>\n",
       "      <th>OA 公开访问名称</th>\n",
       "      <th>HC 高被引状态</th>\n",
       "      <th>HP 热门论文状态</th>\n",
       "      <th>DA 导出日期</th>\n",
       "      <th>UT 入藏号</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>9857</td>\n",
       "      <td>0</td>\n",
       "      <td>Sliding Backstepping Control Design for Roboti...</td>\n",
       "      <td>9857</td>\n",
       "      <td>C</td>\n",
       "      <td>Hsiao, YY; Tu, PH; Hung, JW; Lin, JS</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>IEEE</td>\n",
       "      <td>Hsiao, Ya-Yun; Tu, Po-Hsien; Hung, Jeih-weih; ...</td>\n",
       "      <td>...</td>\n",
       "      <td>Automation &amp; Control Systems</td>\n",
       "      <td>Conference Proceedings Citation Index - Scienc...</td>\n",
       "      <td>Automation &amp; Control Systems</td>\n",
       "      <td>BB8FJ</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2023-03-29 00:00:00</td>\n",
       "      <td>WOS:000346501200114</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>15811</td>\n",
       "      <td>0</td>\n",
       "      <td>Calibration of Embedded Force Sensor for Robot...</td>\n",
       "      <td>15811</td>\n",
       "      <td>C</td>\n",
       "      <td>Nasir, K; Shauri, RLA; Jaafar, J</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>IEEE</td>\n",
       "      <td>Nasir, K.; Shauri, R. L. A.; Jaafar, J.</td>\n",
       "      <td>...</td>\n",
       "      <td>Engineering, Electrical &amp; Electronic</td>\n",
       "      <td>Conference Proceedings Citation Index - Scienc...</td>\n",
       "      <td>Engineering</td>\n",
       "      <td>BG5PA</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2023-03-29 00:00:00</td>\n",
       "      <td>WOS:000389632900068</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1142</td>\n",
       "      <td>0</td>\n",
       "      <td>Constraint Definition for Gripper Selection an...</td>\n",
       "      <td>1142</td>\n",
       "      <td>J</td>\n",
       "      <td>Mohammed, SK; Arbo, MH; Tingelstad, L</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Mohammed, Shafi Khurieshi; Arbo, Mathias Hauan...</td>\n",
       "      <td>...</td>\n",
       "      <td>Engineering, Electrical &amp; Electronic; Engineer...</td>\n",
       "      <td>Science Citation Index Expanded (SCI-EXPANDED)</td>\n",
       "      <td>Engineering</td>\n",
       "      <td>7E6EU</td>\n",
       "      <td>NaN</td>\n",
       "      <td>gold</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2023-03-29 00:00:00</td>\n",
       "      <td>WOS:000901259500001</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>866</td>\n",
       "      <td>0</td>\n",
       "      <td>Energy-saving task assignment for robotic fish...</td>\n",
       "      <td>866</td>\n",
       "      <td>C</td>\n",
       "      <td>Yan, S; Jie, Z; Bing, G; Hao, S</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Jianping, C; Juan, W</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Yan, Shen; Jie, Zhang; Bing, Guo; Hao, Si</td>\n",
       "      <td>...</td>\n",
       "      <td>Engineering, Electrical &amp; Electronic; Instrume...</td>\n",
       "      <td>Conference Proceedings Citation Index - Scienc...</td>\n",
       "      <td>Engineering; Instruments &amp; Instrumentation</td>\n",
       "      <td>BI7SC</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2023-03-29 00:00:00</td>\n",
       "      <td>WOS:000414626500106</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>13042</td>\n",
       "      <td>0</td>\n",
       "      <td>An Interaction-Torque Controller for Robotic E...</td>\n",
       "      <td>13042</td>\n",
       "      <td>C</td>\n",
       "      <td>Vertechy, R; Frisoli, A; Solazzi, M; Pellegrin...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>IEEE; Robotics Society of Japan</td>\n",
       "      <td>Vertechy, R.; Frisoli, A.; Solazzi, M.; Pelleg...</td>\n",
       "      <td>...</td>\n",
       "      <td>Automation &amp; Control Systems; Computer Science...</td>\n",
       "      <td>Conference Proceedings Citation Index - Scienc...</td>\n",
       "      <td>Automation &amp; Control Systems; Computer Science...</td>\n",
       "      <td>BEK21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2023-03-29 00:00:00</td>\n",
       "      <td>WOS:000317042700052</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5 rows × 79 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      编号  标引                                            TI 文献标题   编号.1  \\\n",
       "0   9857   0  Sliding Backstepping Control Design for Roboti...   9857   \n",
       "1  15811   0  Calibration of Embedded Force Sensor for Robot...  15811   \n",
       "2   1142   0  Constraint Definition for Gripper Selection an...   1142   \n",
       "3    866   0  Energy-saving task assignment for robotic fish...    866   \n",
       "4  13042   0  An Interaction-Torque Controller for Robotic E...  13042   \n",
       "\n",
       "  PT 出版物类型                                              AU 作者 BA 书籍作者  \\\n",
       "0        C               Hsiao, YY; Tu, PH; Hung, JW; Lin, JS     NaN   \n",
       "1        C                   Nasir, K; Shauri, RLA; Jaafar, J     NaN   \n",
       "2        J              Mohammed, SK; Arbo, MH; Tingelstad, L     NaN   \n",
       "3        C                    Yan, S; Jie, Z; Bing, G; Hao, S     NaN   \n",
       "4        C  Vertechy, R; Frisoli, A; Solazzi, M; Pellegrin...     NaN   \n",
       "\n",
       "                BE 书籍编者                          GP 团体作者  \\\n",
       "0                   NaN                             IEEE   \n",
       "1                   NaN                             IEEE   \n",
       "2                   NaN                              NaN   \n",
       "3  Jianping, C; Juan, W                              NaN   \n",
       "4                   NaN  IEEE; Robotics Society of Japan   \n",
       "\n",
       "                                             AF 作者全名  ...  \\\n",
       "0  Hsiao, Ya-Yun; Tu, Po-Hsien; Hung, Jeih-weih; ...  ...   \n",
       "1            Nasir, K.; Shauri, R. L. A.; Jaafar, J.  ...   \n",
       "2  Mohammed, Shafi Khurieshi; Arbo, Mathias Hauan...  ...   \n",
       "3          Yan, Shen; Jie, Zhang; Bing, Guo; Hao, Si  ...   \n",
       "4  Vertechy, R.; Frisoli, A.; Solazzi, M.; Pelleg...  ...   \n",
       "\n",
       "                              WC Web of Science 主题类别  \\\n",
       "0                       Automation & Control Systems   \n",
       "1               Engineering, Electrical & Electronic   \n",
       "2  Engineering, Electrical & Electronic; Engineer...   \n",
       "3  Engineering, Electrical & Electronic; Instrume...   \n",
       "4  Automation & Control Systems; Computer Science...   \n",
       "\n",
       "                                WE Web of Science 索引  \\\n",
       "0  Conference Proceedings Citation Index - Scienc...   \n",
       "1  Conference Proceedings Citation Index - Scienc...   \n",
       "2     Science Citation Index Expanded (SCI-EXPANDED)   \n",
       "3  Conference Proceedings Citation Index - Scienc...   \n",
       "4  Conference Proceedings Citation Index - Scienc...   \n",
       "\n",
       "                                             SC 研究方向  GA IDS 编号 PM PubMedID  \\\n",
       "0                       Automation & Control Systems      BB8FJ         NaN   \n",
       "1                                        Engineering      BG5PA         NaN   \n",
       "2                                        Engineering      7E6EU         NaN   \n",
       "3         Engineering; Instruments & Instrumentation      BI7SC         NaN   \n",
       "4  Automation & Control Systems; Computer Science...      BEK21         NaN   \n",
       "\n",
       "  OA 公开访问名称  HC 高被引状态 HP 热门论文状态              DA 导出日期               UT 入藏号  \n",
       "0       NaN       NaN       NaN  2023-03-29 00:00:00  WOS:000346501200114  \n",
       "1       NaN       NaN       NaN  2023-03-29 00:00:00  WOS:000389632900068  \n",
       "2      gold       NaN       NaN  2023-03-29 00:00:00  WOS:000901259500001  \n",
       "3       NaN       NaN       NaN  2023-03-29 00:00:00  WOS:000414626500106  \n",
       "4       NaN       NaN       NaN  2023-03-29 00:00:00  WOS:000317042700052  \n",
       "\n",
       "[5 rows x 79 columns]"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "data = pd.read_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\分类结果\\论文-分类为0-原始标记为2.xlsx')\n",
    "print(data.shape)\n",
    "data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "40c418fd",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([ 9857, 15811,  1142, ..., 21754, 21757, 21758], dtype=int64)"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "bianhao = data['编号'].values\n",
    "bianhao"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "1abb32fc",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████████████████████████████████████████████████████████████████████| 10918/10918 [00:05<00:00, 1865.25it/s]\n"
     ]
    }
   ],
   "source": [
    "idx_ls =[]\n",
    "for i in tqdm(range(len(bianhao))):\n",
    "    ii = bianhao[i]\n",
    "    idx = df[df['编号'] == ii].index\n",
    "    idx_ls.append(idx[0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "d62bd0c7",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "10918"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(idx_ls)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "1ac4eb29",
   "metadata": {},
   "outputs": [],
   "source": [
    "df1 = df.iloc[idx_ls,[3]].reset_index(drop = True)\n",
    "df2 = data[['编号','TI 文献标题','PY 出版年']].reset_index(drop = True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "da832b32",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(10918, 4)\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>PY 出版年</th>\n",
       "      <th>预处理文本</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>9857</td>\n",
       "      <td>Sliding Backstepping Control Design for Roboti...</td>\n",
       "      <td>2014.0</td>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>15811</td>\n",
       "      <td>Calibration of Embedded Force Sensor for Robot...</td>\n",
       "      <td>2016.0</td>\n",
       "      <td>calibration embedded force sensor robotic hand...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1142</td>\n",
       "      <td>Constraint Definition for Gripper Selection an...</td>\n",
       "      <td>2022.0</td>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>866</td>\n",
       "      <td>Energy-saving task assignment for robotic fish...</td>\n",
       "      <td>2015.0</td>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>13042</td>\n",
       "      <td>An Interaction-Torque Controller for Robotic E...</td>\n",
       "      <td>2012.0</td>\n",
       "      <td>interaction-torque controller robotic exoskele...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      编号                                            TI 文献标题  PY 出版年  \\\n",
       "0   9857  Sliding Backstepping Control Design for Roboti...  2014.0   \n",
       "1  15811  Calibration of Embedded Force Sensor for Robot...  2016.0   \n",
       "2   1142  Constraint Definition for Gripper Selection an...  2022.0   \n",
       "3    866  Energy-saving task assignment for robotic fish...  2015.0   \n",
       "4  13042  An Interaction-Torque Controller for Robotic E...  2012.0   \n",
       "\n",
       "                                               预处理文本  \n",
       "0  slide backstepping control design robotic mani...  \n",
       "1  calibration embedded force sensor robotic hand...  \n",
       "2  constraint definition gripper selection grasp ...  \n",
       "3  energy-saving task assignment robotic fish sen...  \n",
       "4  interaction-torque controller robotic exoskele...  "
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "new_data = pd.concat([df2,df1],axis=1)\n",
    "print(new_data.shape)\n",
    "new_data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "e77c0d24",
   "metadata": {},
   "outputs": [],
   "source": [
    "new_data.to_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\1语料-论文.xlsx',index = False)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "5cde75fd",
   "metadata": {},
   "source": [
    "### 2.抽主题"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "d95d89ed",
   "metadata": {},
   "outputs": [],
   "source": [
    "new_data = pd.read_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\2新语料.xlsx')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "93dc5122",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>PY 出版年</th>\n",
       "      <th>预处理文本</th>\n",
       "      <th>预处理文本2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>9857</td>\n",
       "      <td>Sliding Backstepping Control Design for Roboti...</td>\n",
       "      <td>2014.0</td>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>15811</td>\n",
       "      <td>Calibration of Embedded Force Sensor for Robot...</td>\n",
       "      <td>2016.0</td>\n",
       "      <td>calibration embedded force sensor robotic hand...</td>\n",
       "      <td>calibration embed force sensor robotic hand ma...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1142</td>\n",
       "      <td>Constraint Definition for Gripper Selection an...</td>\n",
       "      <td>2022.0</td>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>866</td>\n",
       "      <td>Energy-saving task assignment for robotic fish...</td>\n",
       "      <td>2015.0</td>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>13042</td>\n",
       "      <td>An Interaction-Torque Controller for Robotic E...</td>\n",
       "      <td>2012.0</td>\n",
       "      <td>interaction-torque controller robotic exoskele...</td>\n",
       "      <td>controller robotic exoskeleton flexible joint ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      编号                                            TI 文献标题  PY 出版年  \\\n",
       "0   9857  Sliding Backstepping Control Design for Roboti...  2014.0   \n",
       "1  15811  Calibration of Embedded Force Sensor for Robot...  2016.0   \n",
       "2   1142  Constraint Definition for Gripper Selection an...  2022.0   \n",
       "3    866  Energy-saving task assignment for robotic fish...  2015.0   \n",
       "4  13042  An Interaction-Torque Controller for Robotic E...  2012.0   \n",
       "\n",
       "                                               预处理文本  \\\n",
       "0  slide backstepping control design robotic mani...   \n",
       "1  calibration embedded force sensor robotic hand...   \n",
       "2  constraint definition gripper selection grasp ...   \n",
       "3  energy-saving task assignment robotic fish sen...   \n",
       "4  interaction-torque controller robotic exoskele...   \n",
       "\n",
       "                                              预处理文本2  \n",
       "0  slide backstepping control design robotic mani...  \n",
       "1  calibration embed force sensor robotic hand ma...  \n",
       "2  constraint definition gripper selection grasp ...  \n",
       "3  energy-saving task assignment robotic fish sen...  \n",
       "4  controller robotic exoskeleton flexible joint ...  "
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "new_data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "2b56f840",
   "metadata": {},
   "outputs": [],
   "source": [
    "from bertopic import BERTopic"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "77e29b20",
   "metadata": {},
   "outputs": [],
   "source": [
    "topic_model = BERTopic(language=\"english\"\n",
    "                       , calculate_probabilities=True\n",
    "                       , verbose=True\n",
    "                       , top_n_words = 100\n",
    "                       , n_gram_range = (1, 1)\n",
    "#                        ，nr_topics:  = None\n",
    "                      )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "a8c2ae27",
   "metadata": {},
   "outputs": [],
   "source": [
    "# help(BERTopic)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "34adf1e8",
   "metadata": {},
   "outputs": [],
   "source": [
    "docs = new_data['预处理文本2'].values"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "46e9246b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "bc55e982217e48239646bf14247d70d2",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Batches:   0%|          | 0/943 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "2023-05-05 15:17:52,798 - BERTopic - Transformed documents to Embeddings\n",
      "2023-05-05 15:18:36,678 - BERTopic - Reduced dimensionality\n",
      "2023-05-05 15:20:56,000 - BERTopic - Clustered reduced embeddings\n"
     ]
    }
   ],
   "source": [
    "topics, probs = topic_model.fit_transform(docs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e119fca6",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "id": "f38a9c6d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Topic</th>\n",
       "      <th>Count</th>\n",
       "      <th>Name</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>-1</td>\n",
       "      <td>11954</td>\n",
       "      <td>-1_robot_object_method_data</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0</td>\n",
       "      <td>1919</td>\n",
       "      <td>0_weld_welding_seam_arc</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>965</td>\n",
       "      <td>1_surgical_surgery_patient_bone</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2</td>\n",
       "      <td>953</td>\n",
       "      <td>2_slide_adaptive_manipulator_controller</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>3</td>\n",
       "      <td>595</td>\n",
       "      <td>3_tactile_sensor_sense_soft</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>238</th>\n",
       "      <td>237</td>\n",
       "      <td>10</td>\n",
       "      <td>237_filter_fusion_attitude_kalman</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>239</th>\n",
       "      <td>238</td>\n",
       "      <td>10</td>\n",
       "      <td>238_micromanipulator_compliant_micro_safpm</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>240</th>\n",
       "      <td>239</td>\n",
       "      <td>10</td>\n",
       "      <td>239_navigation_mark_infinite_hunt</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>241</th>\n",
       "      <td>240</td>\n",
       "      <td>10</td>\n",
       "      <td>240_antiexception_machine_pulse_robotized</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>242</th>\n",
       "      <td>241</td>\n",
       "      <td>10</td>\n",
       "      <td>241_pneumatic_soft_multimaterial_finger</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>243 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Topic  Count                                        Name\n",
       "0       -1  11954                 -1_robot_object_method_data\n",
       "1        0   1919                     0_weld_welding_seam_arc\n",
       "2        1    965             1_surgical_surgery_patient_bone\n",
       "3        2    953     2_slide_adaptive_manipulator_controller\n",
       "4        3    595                 3_tactile_sensor_sense_soft\n",
       "..     ...    ...                                         ...\n",
       "238    237     10           237_filter_fusion_attitude_kalman\n",
       "239    238     10  238_micromanipulator_compliant_micro_safpm\n",
       "240    239     10           239_navigation_mark_infinite_hunt\n",
       "241    240     10   240_antiexception_machine_pulse_robotized\n",
       "242    241     10     241_pneumatic_soft_multimaterial_finger\n",
       "\n",
       "[243 rows x 3 columns]"
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 1.查看主题信息\n",
    "topic_model.get_topic_info()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "5d66cb98",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "2023-05-05 15:28:58,171 - BERTopic - Reduced number of topics from 243 to 56\n"
     ]
    }
   ],
   "source": [
    "# 1主题缩减\n",
    "new_topic = topic_model.reduce_topics(docs, nr_topics='auto')\n",
    "topics = new_topic.topics_\n",
    "probabilities = new_topic.probabilities_"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "a17a0e48",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Topic</th>\n",
       "      <th>Count</th>\n",
       "      <th>Name</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>-1</td>\n",
       "      <td>11954</td>\n",
       "      <td>-1_robot_method_system_control</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0</td>\n",
       "      <td>13934</td>\n",
       "      <td>0_weld_robot_method_control</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>965</td>\n",
       "      <td>1_surgical_surgery_patient_robotic</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2</td>\n",
       "      <td>498</td>\n",
       "      <td>2_spray_paint_coat_gun</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>3</td>\n",
       "      <td>282</td>\n",
       "      <td>3_underwater_water_sonar_navigation</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>4</td>\n",
       "      <td>149</td>\n",
       "      <td>4_wafer_semiconductor_transfer_chamber</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>5</td>\n",
       "      <td>147</td>\n",
       "      <td>5_fish_fin_swim_model</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>6</td>\n",
       "      <td>133</td>\n",
       "      <td>6_ultrasonic_needle_ultrasound_biopsy</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>7</td>\n",
       "      <td>117</td>\n",
       "      <td>7_inspection_tank_inspect_bridge</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>8</td>\n",
       "      <td>114</td>\n",
       "      <td>8_fruit_harvest_pick_tomato</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>9</td>\n",
       "      <td>110</td>\n",
       "      <td>9_mow_grass_mower_lawn</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>10</td>\n",
       "      <td>96</td>\n",
       "      <td>10_charge_pile_battery_recharge</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>11</td>\n",
       "      <td>87</td>\n",
       "      <td>11_pipe_pipeline_pipette_inspection</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>12</td>\n",
       "      <td>77</td>\n",
       "      <td>12_sample_blood_cell_dna</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>13</td>\n",
       "      <td>76</td>\n",
       "      <td>13_print_printing_additive_printer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>14</td>\n",
       "      <td>70</td>\n",
       "      <td>14_power_wireless_coil_wpt</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>15</td>\n",
       "      <td>68</td>\n",
       "      <td>15_aerial_flight_manipulator_fly</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>16</td>\n",
       "      <td>65</td>\n",
       "      <td>16_fire_firefighting_extinguish_flame</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>17</td>\n",
       "      <td>61</td>\n",
       "      <td>17_battery_fuel_cell_power</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>18</td>\n",
       "      <td>61</td>\n",
       "      <td>18_weed_crop_spray_pesticide</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>19</td>\n",
       "      <td>61</td>\n",
       "      <td>19_student_education_robotics_educational</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>20</td>\n",
       "      <td>58</td>\n",
       "      <td>20_substrate_transfer_mask_cassette</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>21</td>\n",
       "      <td>58</td>\n",
       "      <td>21_catheter_ablation_vascular_atrial</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>22</td>\n",
       "      <td>56</td>\n",
       "      <td>22_climb_wallclimbing_adhesion_wall</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>23</td>\n",
       "      <td>54</td>\n",
       "      <td>23_emotion_emotional_expression_facial</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>24</td>\n",
       "      <td>45</td>\n",
       "      <td>24_food_dish_cook_kitchen</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>25</td>\n",
       "      <td>42</td>\n",
       "      <td>25_glass_lcd_substrate_sheet</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>26</td>\n",
       "      <td>41</td>\n",
       "      <td>26_photovoltaic_clean_solar_panel</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>27</td>\n",
       "      <td>41</td>\n",
       "      <td>27_park_vehicle_parking_car</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>28</td>\n",
       "      <td>39</td>\n",
       "      <td>28_temperature_heat_thermal_compensation</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>29</td>\n",
       "      <td>39</td>\n",
       "      <td>29_aerial_vehicle_unmanned_flight</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>30</td>\n",
       "      <td>38</td>\n",
       "      <td>30_eeg_brain_bci_signal</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>31</td>\n",
       "      <td>35</td>\n",
       "      <td>31_meat_carcass_cut_poultry</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>32</td>\n",
       "      <td>34</td>\n",
       "      <td>32_nanowire_afm_nanomanipulation_nanomanipulator</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>33</td>\n",
       "      <td>33</td>\n",
       "      <td>33_brake_motor_release_drive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>34</td>\n",
       "      <td>33</td>\n",
       "      <td>34_magnetic_field_geomagnetic_sensor</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>35</td>\n",
       "      <td>31</td>\n",
       "      <td>35_cloth_garment_textile_sew</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>36</td>\n",
       "      <td>30</td>\n",
       "      <td>36_wire_cable_harness_wear</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>37</td>\n",
       "      <td>27</td>\n",
       "      <td>37_spike_neuromorphic_neuron_neural</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>38</td>\n",
       "      <td>27</td>\n",
       "      <td>38_emg_electromyography_signal_human</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>39</td>\n",
       "      <td>26</td>\n",
       "      <td>39_medicine_pharmacy_medication_drug</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>40</td>\n",
       "      <td>26</td>\n",
       "      <td>40_shoe_glue_sole_spray</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>41</td>\n",
       "      <td>23</td>\n",
       "      <td>41_capsule_intestine_endoscopy_tissue</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>42</td>\n",
       "      <td>23</td>\n",
       "      <td>42_substation_inspection_transformer_meter</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>43</td>\n",
       "      <td>22</td>\n",
       "      <td>43_sterilize_disinfection_disinfect_epidemic</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>44</td>\n",
       "      <td>20</td>\n",
       "      <td>44_paint_painting_artwork_artistic</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>45</td>\n",
       "      <td>18</td>\n",
       "      <td>45_iron_steel_alloy_core</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>46</td>\n",
       "      <td>18</td>\n",
       "      <td>46_coal_mine_underground_laneway</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>47</td>\n",
       "      <td>17</td>\n",
       "      <td>47_tire_rim_wheel_sealant</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>48</td>\n",
       "      <td>17</td>\n",
       "      <td>48_energy_consumption_power_industrial</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50</th>\n",
       "      <td>49</td>\n",
       "      <td>16</td>\n",
       "      <td>49_odor_plume_gas_source</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>51</th>\n",
       "      <td>50</td>\n",
       "      <td>15</td>\n",
       "      <td>50_chess_chessboard_chessman_game</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>52</th>\n",
       "      <td>51</td>\n",
       "      <td>13</td>\n",
       "      <td>51_brachytherapy_needle_innovative_cancer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>53</th>\n",
       "      <td>52</td>\n",
       "      <td>12</td>\n",
       "      <td>52_carton_unloader_unload_pile</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>54</th>\n",
       "      <td>53</td>\n",
       "      <td>11</td>\n",
       "      <td>53_slosh_liquid_container_suppression</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>55</th>\n",
       "      <td>54</td>\n",
       "      <td>11</td>\n",
       "      <td>54_encrypt_encryption_key_communication</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Topic  Count                                              Name\n",
       "0      -1  11954                    -1_robot_method_system_control\n",
       "1       0  13934                       0_weld_robot_method_control\n",
       "2       1    965                1_surgical_surgery_patient_robotic\n",
       "3       2    498                            2_spray_paint_coat_gun\n",
       "4       3    282               3_underwater_water_sonar_navigation\n",
       "5       4    149            4_wafer_semiconductor_transfer_chamber\n",
       "6       5    147                             5_fish_fin_swim_model\n",
       "7       6    133             6_ultrasonic_needle_ultrasound_biopsy\n",
       "8       7    117                  7_inspection_tank_inspect_bridge\n",
       "9       8    114                       8_fruit_harvest_pick_tomato\n",
       "10      9    110                            9_mow_grass_mower_lawn\n",
       "11     10     96                   10_charge_pile_battery_recharge\n",
       "12     11     87               11_pipe_pipeline_pipette_inspection\n",
       "13     12     77                          12_sample_blood_cell_dna\n",
       "14     13     76                13_print_printing_additive_printer\n",
       "15     14     70                        14_power_wireless_coil_wpt\n",
       "16     15     68                  15_aerial_flight_manipulator_fly\n",
       "17     16     65             16_fire_firefighting_extinguish_flame\n",
       "18     17     61                        17_battery_fuel_cell_power\n",
       "19     18     61                      18_weed_crop_spray_pesticide\n",
       "20     19     61         19_student_education_robotics_educational\n",
       "21     20     58               20_substrate_transfer_mask_cassette\n",
       "22     21     58              21_catheter_ablation_vascular_atrial\n",
       "23     22     56               22_climb_wallclimbing_adhesion_wall\n",
       "24     23     54            23_emotion_emotional_expression_facial\n",
       "25     24     45                         24_food_dish_cook_kitchen\n",
       "26     25     42                      25_glass_lcd_substrate_sheet\n",
       "27     26     41                 26_photovoltaic_clean_solar_panel\n",
       "28     27     41                       27_park_vehicle_parking_car\n",
       "29     28     39          28_temperature_heat_thermal_compensation\n",
       "30     29     39                 29_aerial_vehicle_unmanned_flight\n",
       "31     30     38                           30_eeg_brain_bci_signal\n",
       "32     31     35                       31_meat_carcass_cut_poultry\n",
       "33     32     34  32_nanowire_afm_nanomanipulation_nanomanipulator\n",
       "34     33     33                      33_brake_motor_release_drive\n",
       "35     34     33              34_magnetic_field_geomagnetic_sensor\n",
       "36     35     31                      35_cloth_garment_textile_sew\n",
       "37     36     30                        36_wire_cable_harness_wear\n",
       "38     37     27               37_spike_neuromorphic_neuron_neural\n",
       "39     38     27              38_emg_electromyography_signal_human\n",
       "40     39     26              39_medicine_pharmacy_medication_drug\n",
       "41     40     26                           40_shoe_glue_sole_spray\n",
       "42     41     23             41_capsule_intestine_endoscopy_tissue\n",
       "43     42     23        42_substation_inspection_transformer_meter\n",
       "44     43     22      43_sterilize_disinfection_disinfect_epidemic\n",
       "45     44     20                44_paint_painting_artwork_artistic\n",
       "46     45     18                          45_iron_steel_alloy_core\n",
       "47     46     18                  46_coal_mine_underground_laneway\n",
       "48     47     17                         47_tire_rim_wheel_sealant\n",
       "49     48     17            48_energy_consumption_power_industrial\n",
       "50     49     16                          49_odor_plume_gas_source\n",
       "51     50     15                 50_chess_chessboard_chessman_game\n",
       "52     51     13         51_brachytherapy_needle_innovative_cancer\n",
       "53     52     12                    52_carton_unloader_unload_pile\n",
       "54     53     11             53_slosh_liquid_container_suppression\n",
       "55     54     11           54_encrypt_encryption_key_communication"
      ]
     },
     "execution_count": 31,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 1.查看主题信息\n",
    "new_topic.get_topic_info()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "c69dd93c",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "2023-05-05 15:32:26,772 - BERTopic - Reduced number of topics from 56 to 46\n"
     ]
    }
   ],
   "source": [
    "# 1主题缩减\n",
    "new_topic = new_topic.reduce_topics(docs, nr_topics='auto')\n",
    "topics = new_topic.topics_\n",
    "probabilities = new_topic.probabilities_"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "55e96a11",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Topic</th>\n",
       "      <th>Count</th>\n",
       "      <th>Name</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>-1</td>\n",
       "      <td>11954</td>\n",
       "      <td>-1_robot_method_system_control</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0</td>\n",
       "      <td>15899</td>\n",
       "      <td>0_weld_robot_method_system</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>227</td>\n",
       "      <td>1_charge_battery_power_pile</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2</td>\n",
       "      <td>149</td>\n",
       "      <td>2_wafer_semiconductor_transfer_chamber</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>3</td>\n",
       "      <td>147</td>\n",
       "      <td>3_fish_fin_swim_model</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>4</td>\n",
       "      <td>133</td>\n",
       "      <td>4_ultrasonic_needle_ultrasound_biopsy</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>5</td>\n",
       "      <td>114</td>\n",
       "      <td>5_fruit_harvest_pick_tomato</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>6</td>\n",
       "      <td>110</td>\n",
       "      <td>6_mow_grass_mower_lawn</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>7</td>\n",
       "      <td>87</td>\n",
       "      <td>7_pipe_pipeline_pipette_inspection</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>8</td>\n",
       "      <td>77</td>\n",
       "      <td>8_sample_blood_cell_dna</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>9</td>\n",
       "      <td>76</td>\n",
       "      <td>9_print_printing_additive_printer</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>10</td>\n",
       "      <td>68</td>\n",
       "      <td>10_aerial_flight_manipulator_fly</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>11</td>\n",
       "      <td>65</td>\n",
       "      <td>11_fire_firefighting_extinguish_flame</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>12</td>\n",
       "      <td>61</td>\n",
       "      <td>12_student_education_robotics_educational</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>13</td>\n",
       "      <td>61</td>\n",
       "      <td>13_weed_crop_spray_pesticide</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>14</td>\n",
       "      <td>58</td>\n",
       "      <td>14_catheter_ablation_vascular_atrial</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>15</td>\n",
       "      <td>58</td>\n",
       "      <td>15_substrate_transfer_mask_cassette</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>16</td>\n",
       "      <td>56</td>\n",
       "      <td>16_climb_wallclimbing_adhesion_wall</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>17</td>\n",
       "      <td>54</td>\n",
       "      <td>17_emotion_emotional_expression_user</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>18</td>\n",
       "      <td>45</td>\n",
       "      <td>18_food_dish_cook_kitchen</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>19</td>\n",
       "      <td>42</td>\n",
       "      <td>19_glass_lcd_substrate_sheet</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>20</td>\n",
       "      <td>41</td>\n",
       "      <td>20_photovoltaic_clean_solar_panel</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>21</td>\n",
       "      <td>41</td>\n",
       "      <td>21_park_vehicle_parking_car</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>22</td>\n",
       "      <td>39</td>\n",
       "      <td>22_aerial_vehicle_unmanned_flight</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>23</td>\n",
       "      <td>39</td>\n",
       "      <td>23_temperature_heat_thermal_compensation</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>24</td>\n",
       "      <td>35</td>\n",
       "      <td>24_meat_carcass_cut_poultry</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>25</td>\n",
       "      <td>34</td>\n",
       "      <td>25_nanowire_afm_nanomanipulation_nanomanipulator</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>26</td>\n",
       "      <td>33</td>\n",
       "      <td>26_brake_motor_release_drive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>27</td>\n",
       "      <td>33</td>\n",
       "      <td>27_magnetic_field_geomagnetic_sensor</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>28</td>\n",
       "      <td>31</td>\n",
       "      <td>28_cloth_garment_textile_sew</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>29</td>\n",
       "      <td>30</td>\n",
       "      <td>29_wire_cable_harness_wear</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>30</td>\n",
       "      <td>26</td>\n",
       "      <td>30_medicine_pharmacy_medication_drug</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>31</td>\n",
       "      <td>26</td>\n",
       "      <td>31_shoe_glue_sole_spray</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>32</td>\n",
       "      <td>23</td>\n",
       "      <td>32_capsule_intestine_endoscopy_tissue</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>33</td>\n",
       "      <td>23</td>\n",
       "      <td>33_substation_inspection_transformer_meter</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>34</td>\n",
       "      <td>22</td>\n",
       "      <td>34_sterilize_disinfection_disinfect_epidemic</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>35</td>\n",
       "      <td>20</td>\n",
       "      <td>35_paint_painting_artwork_artistic</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>36</td>\n",
       "      <td>18</td>\n",
       "      <td>36_coal_mine_underground_laneway</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>37</td>\n",
       "      <td>18</td>\n",
       "      <td>37_iron_steel_alloy_core</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>38</td>\n",
       "      <td>17</td>\n",
       "      <td>38_energy_consumption_industrial_power</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>39</td>\n",
       "      <td>17</td>\n",
       "      <td>39_tire_rim_wheel_sealant</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>40</td>\n",
       "      <td>16</td>\n",
       "      <td>40_odor_plume_gas_source</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>41</td>\n",
       "      <td>15</td>\n",
       "      <td>41_chess_chessboard_chessman_game</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>42</td>\n",
       "      <td>13</td>\n",
       "      <td>42_brachytherapy_needle_innovative_parallel</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>43</td>\n",
       "      <td>12</td>\n",
       "      <td>43_carton_unloader_unload_pile</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>44</td>\n",
       "      <td>11</td>\n",
       "      <td>44_slosh_liquid_container_suppression</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Topic  Count                                              Name\n",
       "0      -1  11954                    -1_robot_method_system_control\n",
       "1       0  15899                        0_weld_robot_method_system\n",
       "2       1    227                       1_charge_battery_power_pile\n",
       "3       2    149            2_wafer_semiconductor_transfer_chamber\n",
       "4       3    147                             3_fish_fin_swim_model\n",
       "5       4    133             4_ultrasonic_needle_ultrasound_biopsy\n",
       "6       5    114                       5_fruit_harvest_pick_tomato\n",
       "7       6    110                            6_mow_grass_mower_lawn\n",
       "8       7     87                7_pipe_pipeline_pipette_inspection\n",
       "9       8     77                           8_sample_blood_cell_dna\n",
       "10      9     76                 9_print_printing_additive_printer\n",
       "11     10     68                  10_aerial_flight_manipulator_fly\n",
       "12     11     65             11_fire_firefighting_extinguish_flame\n",
       "13     12     61         12_student_education_robotics_educational\n",
       "14     13     61                      13_weed_crop_spray_pesticide\n",
       "15     14     58              14_catheter_ablation_vascular_atrial\n",
       "16     15     58               15_substrate_transfer_mask_cassette\n",
       "17     16     56               16_climb_wallclimbing_adhesion_wall\n",
       "18     17     54              17_emotion_emotional_expression_user\n",
       "19     18     45                         18_food_dish_cook_kitchen\n",
       "20     19     42                      19_glass_lcd_substrate_sheet\n",
       "21     20     41                 20_photovoltaic_clean_solar_panel\n",
       "22     21     41                       21_park_vehicle_parking_car\n",
       "23     22     39                 22_aerial_vehicle_unmanned_flight\n",
       "24     23     39          23_temperature_heat_thermal_compensation\n",
       "25     24     35                       24_meat_carcass_cut_poultry\n",
       "26     25     34  25_nanowire_afm_nanomanipulation_nanomanipulator\n",
       "27     26     33                      26_brake_motor_release_drive\n",
       "28     27     33              27_magnetic_field_geomagnetic_sensor\n",
       "29     28     31                      28_cloth_garment_textile_sew\n",
       "30     29     30                        29_wire_cable_harness_wear\n",
       "31     30     26              30_medicine_pharmacy_medication_drug\n",
       "32     31     26                           31_shoe_glue_sole_spray\n",
       "33     32     23             32_capsule_intestine_endoscopy_tissue\n",
       "34     33     23        33_substation_inspection_transformer_meter\n",
       "35     34     22      34_sterilize_disinfection_disinfect_epidemic\n",
       "36     35     20                35_paint_painting_artwork_artistic\n",
       "37     36     18                  36_coal_mine_underground_laneway\n",
       "38     37     18                          37_iron_steel_alloy_core\n",
       "39     38     17            38_energy_consumption_industrial_power\n",
       "40     39     17                         39_tire_rim_wheel_sealant\n",
       "41     40     16                          40_odor_plume_gas_source\n",
       "42     41     15                 41_chess_chessboard_chessman_game\n",
       "43     42     13       42_brachytherapy_needle_innovative_parallel\n",
       "44     43     12                    43_carton_unloader_unload_pile\n",
       "45     44     11             44_slosh_liquid_container_suppression"
      ]
     },
     "execution_count": 33,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 1.查看主题信息\n",
    "new_topic.get_topic_info()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "9c38ed64",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "2023-05-05 15:32:51,142 - BERTopic - Reduced number of topics from 46 to 29\n"
     ]
    }
   ],
   "source": [
    "# 1主题缩减\n",
    "new_topic = new_topic.reduce_topics(docs, nr_topics='auto')\n",
    "topics = new_topic.topics_\n",
    "probabilities = new_topic.probabilities_"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "6fe53e71",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Topic</th>\n",
       "      <th>Count</th>\n",
       "      <th>Name</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>-1</td>\n",
       "      <td>11954</td>\n",
       "      <td>-1_robot_method_system_control</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>0</td>\n",
       "      <td>16802</td>\n",
       "      <td>0_robot_weld_method_system</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>149</td>\n",
       "      <td>1_wafer_semiconductor_transfer_chamber</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2</td>\n",
       "      <td>149</td>\n",
       "      <td>2_fruit_harvest_pick_cut</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>3</td>\n",
       "      <td>110</td>\n",
       "      <td>3_mow_grass_mower_lawn</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>4</td>\n",
       "      <td>94</td>\n",
       "      <td>4_catheter_ablation_capsule_brachytherapy</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>5</td>\n",
       "      <td>87</td>\n",
       "      <td>5_pipe_pipeline_pipette_inspection</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>6</td>\n",
       "      <td>77</td>\n",
       "      <td>6_sample_cell_blood_dna</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>7</td>\n",
       "      <td>76</td>\n",
       "      <td>7_print_printing_additive_manufacturing</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>8</td>\n",
       "      <td>65</td>\n",
       "      <td>8_fire_firefighting_extinguish_flame</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>9</td>\n",
       "      <td>61</td>\n",
       "      <td>9_student_education_robotics_educational</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>10</td>\n",
       "      <td>61</td>\n",
       "      <td>10_weed_spray_crop_pesticide</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>11</td>\n",
       "      <td>54</td>\n",
       "      <td>11_emotion_emotional_expression_user</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>12</td>\n",
       "      <td>45</td>\n",
       "      <td>12_food_dish_cook_kitchen</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>13</td>\n",
       "      <td>41</td>\n",
       "      <td>13_park_vehicle_parking_car</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>14</td>\n",
       "      <td>39</td>\n",
       "      <td>14_temperature_heat_thermal_compensation</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>15</td>\n",
       "      <td>34</td>\n",
       "      <td>15_nanowire_afm_nanomanipulation_nanomanipulator</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>16</td>\n",
       "      <td>33</td>\n",
       "      <td>16_brake_motor_release_drive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>17</td>\n",
       "      <td>33</td>\n",
       "      <td>17_magnetic_field_geomagnetic_sensor</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>18</td>\n",
       "      <td>31</td>\n",
       "      <td>18_cloth_garment_textile_sew</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>19</td>\n",
       "      <td>26</td>\n",
       "      <td>19_shoe_glue_sole_spray</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>20</td>\n",
       "      <td>26</td>\n",
       "      <td>20_medicine_pharmacy_medication_drug</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>21</td>\n",
       "      <td>23</td>\n",
       "      <td>21_substation_inspection_transformer_meter</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>22</td>\n",
       "      <td>22</td>\n",
       "      <td>22_sterilize_disinfection_disinfect_clean</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>23</td>\n",
       "      <td>20</td>\n",
       "      <td>23_paint_painting_artwork_artistic</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>24</td>\n",
       "      <td>18</td>\n",
       "      <td>24_steel_iron_alloy_core</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>25</td>\n",
       "      <td>17</td>\n",
       "      <td>25_tire_rim_wheel_test</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>26</td>\n",
       "      <td>15</td>\n",
       "      <td>26_chess_chessboard_chessman_game</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>27</td>\n",
       "      <td>12</td>\n",
       "      <td>27_carton_unloader_unload_pile</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Topic  Count                                              Name\n",
       "0      -1  11954                    -1_robot_method_system_control\n",
       "1       0  16802                        0_robot_weld_method_system\n",
       "2       1    149            1_wafer_semiconductor_transfer_chamber\n",
       "3       2    149                          2_fruit_harvest_pick_cut\n",
       "4       3    110                            3_mow_grass_mower_lawn\n",
       "5       4     94         4_catheter_ablation_capsule_brachytherapy\n",
       "6       5     87                5_pipe_pipeline_pipette_inspection\n",
       "7       6     77                           6_sample_cell_blood_dna\n",
       "8       7     76           7_print_printing_additive_manufacturing\n",
       "9       8     65              8_fire_firefighting_extinguish_flame\n",
       "10      9     61          9_student_education_robotics_educational\n",
       "11     10     61                      10_weed_spray_crop_pesticide\n",
       "12     11     54              11_emotion_emotional_expression_user\n",
       "13     12     45                         12_food_dish_cook_kitchen\n",
       "14     13     41                       13_park_vehicle_parking_car\n",
       "15     14     39          14_temperature_heat_thermal_compensation\n",
       "16     15     34  15_nanowire_afm_nanomanipulation_nanomanipulator\n",
       "17     16     33                      16_brake_motor_release_drive\n",
       "18     17     33              17_magnetic_field_geomagnetic_sensor\n",
       "19     18     31                      18_cloth_garment_textile_sew\n",
       "20     19     26                           19_shoe_glue_sole_spray\n",
       "21     20     26              20_medicine_pharmacy_medication_drug\n",
       "22     21     23        21_substation_inspection_transformer_meter\n",
       "23     22     22         22_sterilize_disinfection_disinfect_clean\n",
       "24     23     20                23_paint_painting_artwork_artistic\n",
       "25     24     18                          24_steel_iron_alloy_core\n",
       "26     25     17                            25_tire_rim_wheel_test\n",
       "27     26     15                 26_chess_chessboard_chessman_game\n",
       "28     27     12                    27_carton_unloader_unload_pile"
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 1.查看主题信息\n",
    "new_topic.get_topic_info()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "80a62a19",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5cdf5345",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c2113bd5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "id": "47bffb3a",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('robot', 0.023856756900371867),\n",
       " ('weld', 0.021385741032468958),\n",
       " ('method', 0.019484256009176373),\n",
       " ('system', 0.01877302147330145),\n",
       " ('control', 0.018258118179762344),\n",
       " ('position', 0.013717359768671906),\n",
       " ('base', 0.013571603098277617),\n",
       " ('process', 0.013223833299694999),\n",
       " ('robotic', 0.013164398559341412),\n",
       " ('sensor', 0.012724186323946526),\n",
       " ('manipulator', 0.012335679043470703),\n",
       " ('involve', 0.01206881423618904),\n",
       " ('model', 0.012024221450638202),\n",
       " ('data', 0.011618257295119214),\n",
       " ('coordinate', 0.011594875662675499),\n",
       " ('advantage', 0.009977806099203596),\n",
       " ('accord', 0.00965135092431263),\n",
       " ('design', 0.009551803854633827),\n",
       " ('perform', 0.009288091521078769),\n",
       " ('determine', 0.009264890075119152),\n",
       " ('joint', 0.009103486785317845),\n",
       " ('industrial', 0.009083174914905715),\n",
       " ('device', 0.009029211787879955),\n",
       " ('image', 0.008968382914948829),\n",
       " ('draw', 0.008951769543891442),\n",
       " ('track', 0.008871073856182866),\n",
       " ('force', 0.008848547898902116),\n",
       " ('arm', 0.008780915755736805),\n",
       " ('parameter', 0.008598643239297338),\n",
       " ('propose', 0.008517677352051133),\n",
       " ('target', 0.008455736421425048),\n",
       " ('operation', 0.008320292434189355),\n",
       " ('controller', 0.008275027219133353),\n",
       " ('improve', 0.008047082523380423),\n",
       " ('result', 0.008039405375432074),\n",
       " ('parallel', 0.00792831374788244),\n",
       " ('time', 0.007887569534055509),\n",
       " ('surface', 0.007763207809597696),\n",
       " ('claim', 0.007712182302069691),\n",
       " ('path', 0.007626545085521697),\n",
       " ('unit', 0.007573537271909017),\n",
       " ('text', 0.007456127286669599),\n",
       " ('language', 0.007438499661284133),\n",
       " ('provide', 0.0074258462741472585),\n",
       " ('storage', 0.0073922845012142045),\n",
       " ('motion', 0.0073895104426430665),\n",
       " ('laser', 0.007327123905572157),\n",
       " ('paper', 0.007262400910915717),\n",
       " ('set', 0.00717225573514579),\n",
       " ('move', 0.007133305763612967),\n",
       " ('object', 0.007098713800458994),\n",
       " ('spray', 0.00708710192904729),\n",
       " ('dynamic', 0.006942731231705007),\n",
       " ('nonenglish', 0.006866571710150333),\n",
       " ('independent', 0.006824099442631505),\n",
       " ('step', 0.006792134904064769),\n",
       " ('tool', 0.006700417247931942),\n",
       " ('algorithm', 0.006650819373758477),\n",
       " ('enable', 0.006625203693615504),\n",
       " ('task', 0.006456403810042909),\n",
       " ('workpiece', 0.006346907300530763),\n",
       " ('calibration', 0.006334268975433459),\n",
       " ('trajectory', 0.006289767330307212),\n",
       " ('space', 0.0062741427983073065),\n",
       " ('module', 0.006256399447589563),\n",
       " ('generate', 0.006255164589684764),\n",
       " ('calculate', 0.0062515552964579075),\n",
       " ('signal', 0.006198578090307949),\n",
       " ('surgical', 0.006194657209001123),\n",
       " ('clean', 0.006171515673596217),\n",
       " ('assembly', 0.006158151489495459),\n",
       " ('movement', 0.006079526736311283),\n",
       " ('network', 0.00603872157573126),\n",
       " ('performance', 0.006034588262548605),\n",
       " ('reduce', 0.006030633287719681),\n",
       " ('error', 0.006018368188851717),\n",
       " ('program', 0.005947013178319923),\n",
       " ('application', 0.0058852374805821225),\n",
       " ('illustrate', 0.005807266142349633),\n",
       " ('structure', 0.005721546251436242),\n",
       " ('angle', 0.005677001351422363),\n",
       " ('polish', 0.005666621180290594),\n",
       " ('processing', 0.00565552607240145),\n",
       " ('detect', 0.005636568059429286),\n",
       " ('welding', 0.0056320103847760095),\n",
       " ('detailed', 0.005582703526710208),\n",
       " ('store', 0.005575056881206126),\n",
       " ('environment', 0.005564146553893747),\n",
       " ('mechanical', 0.0054402483324976735),\n",
       " ('measure', 0.005411958617198567),\n",
       " ('simulation', 0.0053657068071711255),\n",
       " ('analysis', 0.005362935920770812),\n",
       " ('current', 0.005360460446013974),\n",
       " ('speed', 0.005339529757288325),\n",
       " ('mechanism', 0.00532313678257949),\n",
       " ('realize', 0.005294923834331811),\n",
       " ('mode', 0.005263911908536471),\n",
       " ('flow', 0.005243516163120713),\n",
       " ('user', 0.0051664078155428065),\n",
       " ('detection', 0.0050947268988103065)]"
      ]
     },
     "execution_count": 36,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 2查看具体主题关键词   默认前十个\n",
    "new_topic.get_topic(0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "id": "533b6bd9",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['advantage', 'enable', 'step', 'robotic', 'path', 'position', 'unit', 'claim', 'task', 'data', 'operation', 'image', 'improve', 'provide', 'device', 'robot', 'control', 'independent', 'detect', 'generate', 'accord', 'method', 'controller', 'system', 'coordinate', 'base', 'sensor', 'set', 'reduce', 'module', 'speed', 'detection', 'detailed', 'process', 'draw', 'involve', 'signal', 'perform', 'current', 'tool', 'environment', 'mode', 'determine', 'time']\n"
     ]
    }
   ],
   "source": [
    "# 查看关键词交集\n",
    "ls1,ls2 = [],[]\n",
    "for item in new_topic.get_topic(0):\n",
    "    ls1.append(item[0])\n",
    "\n",
    "for item in new_topic.get_topic(3):\n",
    "    ls2.append(item[0])\n",
    "\n",
    "set1 = set(ls1)\n",
    "set2 = set(ls2)\n",
    "\n",
    "set3 = set1 & set2\n",
    "list3 = list(set3)\n",
    "print(list3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "id": "29730ddb",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Document</th>\n",
       "      <th>Topic</th>\n",
       "      <th>Name</th>\n",
       "      <th>Top_n_words</th>\n",
       "      <th>Probability</th>\n",
       "      <th>Representative_document</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "      <td>0</td>\n",
       "      <td>0_robot_weld_method_system</td>\n",
       "      <td>robot - weld - method - system - control - pos...</td>\n",
       "      <td>0.910798</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>calibration embed force sensor robotic hand ma...</td>\n",
       "      <td>0</td>\n",
       "      <td>0_robot_weld_method_system</td>\n",
       "      <td>robot - weld - method - system - control - pos...</td>\n",
       "      <td>0.846442</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "      <td>-1</td>\n",
       "      <td>-1_robot_method_system_control</td>\n",
       "      <td>robot - method - system - control - position -...</td>\n",
       "      <td>0.879925</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "      <td>0</td>\n",
       "      <td>0_robot_weld_method_system</td>\n",
       "      <td>robot - weld - method - system - control - pos...</td>\n",
       "      <td>0.218918</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>controller robotic exoskeleton flexible joint ...</td>\n",
       "      <td>0</td>\n",
       "      <td>0_robot_weld_method_system</td>\n",
       "      <td>robot - weld - method - system - control - pos...</td>\n",
       "      <td>0.926832</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30169</th>\n",
       "      <td>multi-sensor fusion simultaneous localization ...</td>\n",
       "      <td>-1</td>\n",
       "      <td>-1_robot_method_system_control</td>\n",
       "      <td>robot - method - system - control - position -...</td>\n",
       "      <td>0.314525</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30170</th>\n",
       "      <td>autonomous move object robotic vacuum clean de...</td>\n",
       "      <td>-1</td>\n",
       "      <td>-1_robot_method_system_control</td>\n",
       "      <td>robot - method - system - control - position -...</td>\n",
       "      <td>0.792036</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30171</th>\n",
       "      <td>vision sensor base robot locate device obstacl...</td>\n",
       "      <td>-1</td>\n",
       "      <td>-1_robot_method_system_control</td>\n",
       "      <td>robot - method - system - control - position -...</td>\n",
       "      <td>0.180671</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30172</th>\n",
       "      <td>fusion imu optical distance measure sensor int...</td>\n",
       "      <td>0</td>\n",
       "      <td>0_robot_weld_method_system</td>\n",
       "      <td>robot - weld - method - system - control - pos...</td>\n",
       "      <td>0.680124</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30173</th>\n",
       "      <td>collision detection boundary tune system robot...</td>\n",
       "      <td>0</td>\n",
       "      <td>0_robot_weld_method_system</td>\n",
       "      <td>robot - weld - method - system - control - pos...</td>\n",
       "      <td>0.790034</td>\n",
       "      <td>False</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>30174 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                Document  Topic  \\\n",
       "0      slide backstepping control design robotic mani...      0   \n",
       "1      calibration embed force sensor robotic hand ma...      0   \n",
       "2      constraint definition gripper selection grasp ...     -1   \n",
       "3      energy-saving task assignment robotic fish sen...      0   \n",
       "4      controller robotic exoskeleton flexible joint ...      0   \n",
       "...                                                  ...    ...   \n",
       "30169  multi-sensor fusion simultaneous localization ...     -1   \n",
       "30170  autonomous move object robotic vacuum clean de...     -1   \n",
       "30171  vision sensor base robot locate device obstacl...     -1   \n",
       "30172  fusion imu optical distance measure sensor int...      0   \n",
       "30173  collision detection boundary tune system robot...      0   \n",
       "\n",
       "                                 Name  \\\n",
       "0          0_robot_weld_method_system   \n",
       "1          0_robot_weld_method_system   \n",
       "2      -1_robot_method_system_control   \n",
       "3          0_robot_weld_method_system   \n",
       "4          0_robot_weld_method_system   \n",
       "...                               ...   \n",
       "30169  -1_robot_method_system_control   \n",
       "30170  -1_robot_method_system_control   \n",
       "30171  -1_robot_method_system_control   \n",
       "30172      0_robot_weld_method_system   \n",
       "30173      0_robot_weld_method_system   \n",
       "\n",
       "                                             Top_n_words  Probability  \\\n",
       "0      robot - weld - method - system - control - pos...     0.910798   \n",
       "1      robot - weld - method - system - control - pos...     0.846442   \n",
       "2      robot - method - system - control - position -...     0.879925   \n",
       "3      robot - weld - method - system - control - pos...     0.218918   \n",
       "4      robot - weld - method - system - control - pos...     0.926832   \n",
       "...                                                  ...          ...   \n",
       "30169  robot - method - system - control - position -...     0.314525   \n",
       "30170  robot - method - system - control - position -...     0.792036   \n",
       "30171  robot - method - system - control - position -...     0.180671   \n",
       "30172  robot - weld - method - system - control - pos...     0.680124   \n",
       "30173  robot - weld - method - system - control - pos...     0.790034   \n",
       "\n",
       "       Representative_document  \n",
       "0                        False  \n",
       "1                        False  \n",
       "2                        False  \n",
       "3                        False  \n",
       "4                        False  \n",
       "...                        ...  \n",
       "30169                    False  \n",
       "30170                    False  \n",
       "30171                    False  \n",
       "30172                    False  \n",
       "30173                    False  \n",
       "\n",
       "[30174 rows x 6 columns]"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 3查看文档属于当前主题的概率\n",
    "new_topic.get_document_info(docs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "id": "6ecee708",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>PY 出版年</th>\n",
       "      <th>预处理文本</th>\n",
       "      <th>预处理文本2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>9857</td>\n",
       "      <td>Sliding Backstepping Control Design for Roboti...</td>\n",
       "      <td>2014.0</td>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>15811</td>\n",
       "      <td>Calibration of Embedded Force Sensor for Robot...</td>\n",
       "      <td>2016.0</td>\n",
       "      <td>calibration embedded force sensor robotic hand...</td>\n",
       "      <td>calibration embed force sensor robotic hand ma...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1142</td>\n",
       "      <td>Constraint Definition for Gripper Selection an...</td>\n",
       "      <td>2022.0</td>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>866</td>\n",
       "      <td>Energy-saving task assignment for robotic fish...</td>\n",
       "      <td>2015.0</td>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>13042</td>\n",
       "      <td>An Interaction-Torque Controller for Robotic E...</td>\n",
       "      <td>2012.0</td>\n",
       "      <td>interaction-torque controller robotic exoskele...</td>\n",
       "      <td>controller robotic exoskeleton flexible joint ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      编号                                            TI 文献标题  PY 出版年  \\\n",
       "0   9857  Sliding Backstepping Control Design for Roboti...  2014.0   \n",
       "1  15811  Calibration of Embedded Force Sensor for Robot...  2016.0   \n",
       "2   1142  Constraint Definition for Gripper Selection an...  2022.0   \n",
       "3    866  Energy-saving task assignment for robotic fish...  2015.0   \n",
       "4  13042  An Interaction-Torque Controller for Robotic E...  2012.0   \n",
       "\n",
       "                                               预处理文本  \\\n",
       "0  slide backstepping control design robotic mani...   \n",
       "1  calibration embedded force sensor robotic hand...   \n",
       "2  constraint definition gripper selection grasp ...   \n",
       "3  energy-saving task assignment robotic fish sen...   \n",
       "4  interaction-torque controller robotic exoskele...   \n",
       "\n",
       "                                              预处理文本2  \n",
       "0  slide backstepping control design robotic mani...  \n",
       "1  calibration embed force sensor robotic hand ma...  \n",
       "2  constraint definition gripper selection grasp ...  \n",
       "3  energy-saving task assignment robotic fish sen...  \n",
       "4  controller robotic exoskeleton flexible joint ...  "
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 保存表格\n",
    "new_data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "id": "90a004ac",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Document</th>\n",
       "      <th>Topic</th>\n",
       "      <th>Probability</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.910798</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>calibration embed force sensor robotic hand ma...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.846442</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "      <td>-1</td>\n",
       "      <td>0.879925</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.218918</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>controller robotic exoskeleton flexible joint ...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.926832</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                            Document  Topic  Probability\n",
       "0  slide backstepping control design robotic mani...      0     0.910798\n",
       "1  calibration embed force sensor robotic hand ma...      0     0.846442\n",
       "2  constraint definition gripper selection grasp ...     -1     0.879925\n",
       "3  energy-saving task assignment robotic fish sen...      0     0.218918\n",
       "4  controller robotic exoskeleton flexible joint ...      0     0.926832"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "need_data = new_topic.get_document_info(docs).iloc[:,[0,1,4]]\n",
    "need_data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "id": "3d167ff4",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>编号</th>\n",
       "      <th>TI 文献标题</th>\n",
       "      <th>PY 出版年</th>\n",
       "      <th>预处理文本</th>\n",
       "      <th>预处理文本2</th>\n",
       "      <th>Document</th>\n",
       "      <th>Topic</th>\n",
       "      <th>Probability</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>9857</td>\n",
       "      <td>Sliding Backstepping Control Design for Roboti...</td>\n",
       "      <td>2014.0</td>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "      <td>slide backstepping control design robotic mani...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.910798</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>15811</td>\n",
       "      <td>Calibration of Embedded Force Sensor for Robot...</td>\n",
       "      <td>2016.0</td>\n",
       "      <td>calibration embedded force sensor robotic hand...</td>\n",
       "      <td>calibration embed force sensor robotic hand ma...</td>\n",
       "      <td>calibration embed force sensor robotic hand ma...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.846442</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1142</td>\n",
       "      <td>Constraint Definition for Gripper Selection an...</td>\n",
       "      <td>2022.0</td>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "      <td>constraint definition gripper selection grasp ...</td>\n",
       "      <td>-1</td>\n",
       "      <td>0.879925</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>866</td>\n",
       "      <td>Energy-saving task assignment for robotic fish...</td>\n",
       "      <td>2015.0</td>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "      <td>energy-saving task assignment robotic fish sen...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.218918</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>13042</td>\n",
       "      <td>An Interaction-Torque Controller for Robotic E...</td>\n",
       "      <td>2012.0</td>\n",
       "      <td>interaction-torque controller robotic exoskele...</td>\n",
       "      <td>controller robotic exoskeleton flexible joint ...</td>\n",
       "      <td>controller robotic exoskeleton flexible joint ...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.926832</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      编号                                            TI 文献标题  PY 出版年  \\\n",
       "0   9857  Sliding Backstepping Control Design for Roboti...  2014.0   \n",
       "1  15811  Calibration of Embedded Force Sensor for Robot...  2016.0   \n",
       "2   1142  Constraint Definition for Gripper Selection an...  2022.0   \n",
       "3    866  Energy-saving task assignment for robotic fish...  2015.0   \n",
       "4  13042  An Interaction-Torque Controller for Robotic E...  2012.0   \n",
       "\n",
       "                                               预处理文本  \\\n",
       "0  slide backstepping control design robotic mani...   \n",
       "1  calibration embedded force sensor robotic hand...   \n",
       "2  constraint definition gripper selection grasp ...   \n",
       "3  energy-saving task assignment robotic fish sen...   \n",
       "4  interaction-torque controller robotic exoskele...   \n",
       "\n",
       "                                              预处理文本2  \\\n",
       "0  slide backstepping control design robotic mani...   \n",
       "1  calibration embed force sensor robotic hand ma...   \n",
       "2  constraint definition gripper selection grasp ...   \n",
       "3  energy-saving task assignment robotic fish sen...   \n",
       "4  controller robotic exoskeleton flexible joint ...   \n",
       "\n",
       "                                            Document  Topic  Probability  \n",
       "0  slide backstepping control design robotic mani...      0     0.910798  \n",
       "1  calibration embed force sensor robotic hand ma...      0     0.846442  \n",
       "2  constraint definition gripper selection grasp ...     -1     0.879925  \n",
       "3  energy-saving task assignment robotic fish sen...      0     0.218918  \n",
       "4  controller robotic exoskeleton flexible joint ...      0     0.926832  "
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "save_data = pd.concat([new_data, need_data],axis=1)\n",
    "save_data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "id": "0e494c02",
   "metadata": {},
   "outputs": [],
   "source": [
    "# save_data.to_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\4文档属于主题的概率.xlsx',index = False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f3f0e8e2",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "id": "c6411765",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{-1: [('robot', 0.027924716780815685),\n",
       "  ('method', 0.02182208319930399),\n",
       "  ('system', 0.019354451705335705),\n",
       "  ('control', 0.01771060224182882),\n",
       "  ('position', 0.01663738552905588),\n",
       "  ('data', 0.015452631064019742),\n",
       "  ('process', 0.015033634491049499),\n",
       "  ('base', 0.014536337733339288),\n",
       "  ('involve', 0.014320918044287487),\n",
       "  ('sensor', 0.014249235575067246),\n",
       "  ('image', 0.013769665599162133),\n",
       "  ('object', 0.013255140287525918),\n",
       "  ('arm', 0.012357931097915505),\n",
       "  ('industrial', 0.01204877397768712),\n",
       "  ('target', 0.011861895601685834),\n",
       "  ('advantage', 0.011687432610853386),\n",
       "  ('model', 0.011620626300869371),\n",
       "  ('determine', 0.011613186796642777),\n",
       "  ('device', 0.011426451103378057),\n",
       "  ('coordinate', 0.011231134088700665),\n",
       "  ('draw', 0.011190617744104854),\n",
       "  ('accord', 0.010920364377207104),\n",
       "  ('robotic', 0.010835113915064467),\n",
       "  ('mobile', 0.0104518973120526),\n",
       "  ('operation', 0.010301943617859327),\n",
       "  ('perform', 0.010217969604749503),\n",
       "  ('claim', 0.010007829717664486),\n",
       "  ('assembly', 0.009985621467895783),\n",
       "  ('unit', 0.009435348843396361),\n",
       "  ('task', 0.009169359634611105),\n",
       "  ('move', 0.00907029051166646),\n",
       "  ('module', 0.008942247685773248),\n",
       "  ('map', 0.008823351275958399),\n",
       "  ('independent', 0.00882264915717405),\n",
       "  ('language', 0.008811976876057073),\n",
       "  ('environment', 0.00874662740818692),\n",
       "  ('path', 0.008657957445660077),\n",
       "  ('set', 0.008637524303974667),\n",
       "  ('step', 0.008541155515840037),\n",
       "  ('text', 0.008482059562674761),\n",
       "  ('motion', 0.008400710735556918),\n",
       "  ('enable', 0.008397713222750985),\n",
       "  ('nonenglish', 0.008375667932871337),\n",
       "  ('camera', 0.008308366575528844),\n",
       "  ('processing', 0.008274315992463487),\n",
       "  ('provide', 0.008271232892439315),\n",
       "  ('time', 0.008270584909474655),\n",
       "  ('joint', 0.00819726867998358),\n",
       "  ('store', 0.007988148936282332),\n",
       "  ('improve', 0.007864685362590487),\n",
       "  ('detect', 0.007817604456022594),\n",
       "  ('movement', 0.007777223606016826),\n",
       "  ('manipulator', 0.007535254965161717),\n",
       "  ('generate', 0.007369350208306982),\n",
       "  ('storage', 0.007002478985201882),\n",
       "  ('instruction', 0.006972299559591628),\n",
       "  ('detailed', 0.00695969951221793),\n",
       "  ('mechanical', 0.0069435184491947344),\n",
       "  ('force', 0.006917980755271089),\n",
       "  ('calculate', 0.006871499833861624),\n",
       "  ('program', 0.006860121594572084),\n",
       "  ('parameter', 0.006796707653522956),\n",
       "  ('detection', 0.006770301177465442),\n",
       "  ('diagram', 0.006737817319558328),\n",
       "  ('signal', 0.006736720063112948),\n",
       "  ('space', 0.006725987029589371),\n",
       "  ('pose', 0.006704232004301266),\n",
       "  ('user', 0.006690488862747377),\n",
       "  ('illustrate', 0.006684709845010226),\n",
       "  ('result', 0.006584650463312395),\n",
       "  ('track', 0.006569008721919069),\n",
       "  ('computer', 0.006562561278972255),\n",
       "  ('current', 0.006561473903249636),\n",
       "  ('drive', 0.006557434815512576),\n",
       "  ('controller', 0.006343827553783268),\n",
       "  ('location', 0.006206675252847946),\n",
       "  ('design', 0.0061710876761221535),\n",
       "  ('reduce', 0.006163938378070011),\n",
       "  ('receive', 0.006123319915674893),\n",
       "  ('distance', 0.005970634145334859),\n",
       "  ('tool', 0.005923819440985537),\n",
       "  ('view', 0.0059103572842738854),\n",
       "  ('application', 0.005898084882575815),\n",
       "  ('obstacle', 0.005859566450637484),\n",
       "  ('machine', 0.00583327897938622),\n",
       "  ('component', 0.005807111559321266),\n",
       "  ('flow', 0.005761714849088192),\n",
       "  ('realize', 0.005715998422768404),\n",
       "  ('workpiece', 0.00571511551478124),\n",
       "  ('algorithm', 0.005661887721293762),\n",
       "  ('plan', 0.00561421019091812),\n",
       "  ('vision', 0.005564373712653018),\n",
       "  ('comprise', 0.005539592051909754),\n",
       "  ('operate', 0.0054599739270633435),\n",
       "  ('intelligent', 0.005448610644655827),\n",
       "  ('network', 0.005416033517974105),\n",
       "  ('vehicle', 0.0054055409930162356),\n",
       "  ('collect', 0.0053837928421390825),\n",
       "  ('multiple', 0.0053654651535949395),\n",
       "  ('measure', 0.005345772493694635)],\n",
       " 0: [('robot', 0.023856756900371867),\n",
       "  ('weld', 0.021385741032468958),\n",
       "  ('method', 0.019484256009176373),\n",
       "  ('system', 0.01877302147330145),\n",
       "  ('control', 0.018258118179762344),\n",
       "  ('position', 0.013717359768671906),\n",
       "  ('base', 0.013571603098277617),\n",
       "  ('process', 0.013223833299694999),\n",
       "  ('robotic', 0.013164398559341412),\n",
       "  ('sensor', 0.012724186323946526),\n",
       "  ('manipulator', 0.012335679043470703),\n",
       "  ('involve', 0.01206881423618904),\n",
       "  ('model', 0.012024221450638202),\n",
       "  ('data', 0.011618257295119214),\n",
       "  ('coordinate', 0.011594875662675499),\n",
       "  ('advantage', 0.009977806099203596),\n",
       "  ('accord', 0.00965135092431263),\n",
       "  ('design', 0.009551803854633827),\n",
       "  ('perform', 0.009288091521078769),\n",
       "  ('determine', 0.009264890075119152),\n",
       "  ('joint', 0.009103486785317845),\n",
       "  ('industrial', 0.009083174914905715),\n",
       "  ('device', 0.009029211787879955),\n",
       "  ('image', 0.008968382914948829),\n",
       "  ('draw', 0.008951769543891442),\n",
       "  ('track', 0.008871073856182866),\n",
       "  ('force', 0.008848547898902116),\n",
       "  ('arm', 0.008780915755736805),\n",
       "  ('parameter', 0.008598643239297338),\n",
       "  ('propose', 0.008517677352051133),\n",
       "  ('target', 0.008455736421425048),\n",
       "  ('operation', 0.008320292434189355),\n",
       "  ('controller', 0.008275027219133353),\n",
       "  ('improve', 0.008047082523380423),\n",
       "  ('result', 0.008039405375432074),\n",
       "  ('parallel', 0.00792831374788244),\n",
       "  ('time', 0.007887569534055509),\n",
       "  ('surface', 0.007763207809597696),\n",
       "  ('claim', 0.007712182302069691),\n",
       "  ('path', 0.007626545085521697),\n",
       "  ('unit', 0.007573537271909017),\n",
       "  ('text', 0.007456127286669599),\n",
       "  ('language', 0.007438499661284133),\n",
       "  ('provide', 0.0074258462741472585),\n",
       "  ('storage', 0.0073922845012142045),\n",
       "  ('motion', 0.0073895104426430665),\n",
       "  ('laser', 0.007327123905572157),\n",
       "  ('paper', 0.007262400910915717),\n",
       "  ('set', 0.00717225573514579),\n",
       "  ('move', 0.007133305763612967),\n",
       "  ('object', 0.007098713800458994),\n",
       "  ('spray', 0.00708710192904729),\n",
       "  ('dynamic', 0.006942731231705007),\n",
       "  ('nonenglish', 0.006866571710150333),\n",
       "  ('independent', 0.006824099442631505),\n",
       "  ('step', 0.006792134904064769),\n",
       "  ('tool', 0.006700417247931942),\n",
       "  ('algorithm', 0.006650819373758477),\n",
       "  ('enable', 0.006625203693615504),\n",
       "  ('task', 0.006456403810042909),\n",
       "  ('workpiece', 0.006346907300530763),\n",
       "  ('calibration', 0.006334268975433459),\n",
       "  ('trajectory', 0.006289767330307212),\n",
       "  ('space', 0.0062741427983073065),\n",
       "  ('module', 0.006256399447589563),\n",
       "  ('generate', 0.006255164589684764),\n",
       "  ('calculate', 0.0062515552964579075),\n",
       "  ('signal', 0.006198578090307949),\n",
       "  ('surgical', 0.006194657209001123),\n",
       "  ('clean', 0.006171515673596217),\n",
       "  ('assembly', 0.006158151489495459),\n",
       "  ('movement', 0.006079526736311283),\n",
       "  ('network', 0.00603872157573126),\n",
       "  ('performance', 0.006034588262548605),\n",
       "  ('reduce', 0.006030633287719681),\n",
       "  ('error', 0.006018368188851717),\n",
       "  ('program', 0.005947013178319923),\n",
       "  ('application', 0.0058852374805821225),\n",
       "  ('illustrate', 0.005807266142349633),\n",
       "  ('structure', 0.005721546251436242),\n",
       "  ('angle', 0.005677001351422363),\n",
       "  ('polish', 0.005666621180290594),\n",
       "  ('processing', 0.00565552607240145),\n",
       "  ('detect', 0.005636568059429286),\n",
       "  ('welding', 0.0056320103847760095),\n",
       "  ('detailed', 0.005582703526710208),\n",
       "  ('store', 0.005575056881206126),\n",
       "  ('environment', 0.005564146553893747),\n",
       "  ('mechanical', 0.0054402483324976735),\n",
       "  ('measure', 0.005411958617198567),\n",
       "  ('simulation', 0.0053657068071711255),\n",
       "  ('analysis', 0.005362935920770812),\n",
       "  ('current', 0.005360460446013974),\n",
       "  ('speed', 0.005339529757288325),\n",
       "  ('mechanism', 0.00532313678257949),\n",
       "  ('realize', 0.005294923834331811),\n",
       "  ('mode', 0.005263911908536471),\n",
       "  ('flow', 0.005243516163120713),\n",
       "  ('user', 0.0051664078155428065),\n",
       "  ('detection', 0.0050947268988103065)],\n",
       " 1: [('wafer', 0.3449703523863214),\n",
       "  ('semiconductor', 0.09062157489473412),\n",
       "  ('transfer', 0.08166377390384202),\n",
       "  ('chamber', 0.044410172981332485),\n",
       "  ('position', 0.035359141545083815),\n",
       "  ('cassette', 0.03283739645097932),\n",
       "  ('process', 0.03151175318553651),\n",
       "  ('arm', 0.030823460992226572),\n",
       "  ('substrate', 0.028661934899516548),\n",
       "  ('robot', 0.025617343440437344),\n",
       "  ('vacuum', 0.024770224192613457),\n",
       "  ('method', 0.023431646441102176),\n",
       "  ('effector', 0.022366681681669956),\n",
       "  ('processing', 0.021292065791647594),\n",
       "  ('load', 0.02096810465305149),\n",
       "  ('silicon', 0.020631088950421567),\n",
       "  ('alignment', 0.01956555560175465),\n",
       "  ('center', 0.018750378920023677),\n",
       "  ('system', 0.01851416593424216),\n",
       "  ('carrier', 0.01799202111574269),\n",
       "  ('involve', 0.017241549569283945),\n",
       "  ('module', 0.0167907908704788),\n",
       "  ('pod', 0.016551656197699348),\n",
       "  ('hand', 0.016360341375860798),\n",
       "  ('align', 0.014544312218967053),\n",
       "  ('calibration', 0.014319475794836747),\n",
       "  ('equipment', 0.014226795539215282),\n",
       "  ('sensor', 0.013990743983309075),\n",
       "  ('advantage', 0.013848363583066738),\n",
       "  ('handle', 0.013817278346513327),\n",
       "  ('location', 0.01350462971335834),\n",
       "  ('pedestal', 0.013291085825405185),\n",
       "  ('move', 0.013098425562716568),\n",
       "  ('device', 0.012517865776765552),\n",
       "  ('claim', 0.01241189303591274),\n",
       "  ('schedule', 0.012126323047007425),\n",
       "  ('apparatus', 0.012009616268804145),\n",
       "  ('step', 0.011999438306278734),\n",
       "  ('mechanical', 0.01178990699708135),\n",
       "  ('draw', 0.01173412143065008),\n",
       "  ('provide', 0.011638880784482523),\n",
       "  ('solar', 0.011291983704448278),\n",
       "  ('chip', 0.011282402386162915),\n",
       "  ('independent', 0.010967124280760092),\n",
       "  ('fabrication', 0.010895913742027337),\n",
       "  ('tool', 0.010748641548855372),\n",
       "  ('seal', 0.010722816129084075),\n",
       "  ('unload', 0.010689094208939825),\n",
       "  ('clean', 0.010683163990526118),\n",
       "  ('manufacturing', 0.010625584557614524),\n",
       "  ('transport', 0.01059048969822574),\n",
       "  ('support', 0.01033340973430465),\n",
       "  ('cell', 0.010327466824908087),\n",
       "  ('calibrate', 0.010302975295353648),\n",
       "  ('detailed', 0.010258760746122949),\n",
       "  ('view', 0.010062472446301861),\n",
       "  ('eg', 0.01005622709093686),\n",
       "  ('manufacture', 0.0097960970121169),\n",
       "  ('boat', 0.009731167278291306),\n",
       "  ('circuit', 0.009647151614908069),\n",
       "  ('determine', 0.009597538411868172),\n",
       "  ('coat', 0.009374549479130743),\n",
       "  ('unit', 0.009299926094115452),\n",
       "  ('station', 0.009254435331655467),\n",
       "  ('chemical', 0.009213885089992319),\n",
       "  ('front', 0.009119068580619736),\n",
       "  ('damage', 0.008897793870635348),\n",
       "  ('plate', 0.008866314434044991),\n",
       "  ('film', 0.00876529967636582),\n",
       "  ('arrange', 0.008736591747371942),\n",
       "  ('detect', 0.008596963423269674),\n",
       "  ('portion', 0.00819487209580135),\n",
       "  ('gripper', 0.00802404449888827),\n",
       "  ('blade', 0.008020899630974259),\n",
       "  ('cluster', 0.008015701342681855),\n",
       "  ('remove', 0.007974434500931677),\n",
       "  ('lot', 0.007972862884268338),\n",
       "  ('stage', 0.007956418387511903),\n",
       "  ('rotate', 0.007897772859478248),\n",
       "  ('aligner', 0.007813279571263593),\n",
       "  ('amorphous', 0.007813279571263593),\n",
       "  ('magnetic', 0.007761995757004883),\n",
       "  ('time', 0.007611097907665974),\n",
       "  ('edge', 0.007516911492999067),\n",
       "  ('fluid', 0.007461152481702118),\n",
       "  ('prevent', 0.007412430436580375),\n",
       "  ('improve', 0.007400934316645833),\n",
       "  ('reduce', 0.007393070966270446),\n",
       "  ('control', 0.00737443633941507),\n",
       "  ('bond', 0.0073495978457340716),\n",
       "  ('port', 0.007312675837231089),\n",
       "  ('waferlike', 0.007230873291765883),\n",
       "  ('spin', 0.007201770378297599),\n",
       "  ('measure', 0.007184715915500247),\n",
       "  ('correct', 0.0071044871103892425),\n",
       "  ('finger', 0.00704946705156008),\n",
       "  ('cavity', 0.00701658173745007),\n",
       "  ('container', 0.006873018736395555),\n",
       "  ('base', 0.006869710314677349),\n",
       "  ('robotic', 0.006850810836459794)],\n",
       " 2: [('fruit', 0.13071003938352796),\n",
       "  ('harvest', 0.06713562137860277),\n",
       "  ('pick', 0.051667852149751795),\n",
       "  ('cut', 0.05122978665825265),\n",
       "  ('meat', 0.04443150218148142),\n",
       "  ('carcass', 0.030719415066457628),\n",
       "  ('image', 0.029337053107221896),\n",
       "  ('tomato', 0.02621451429153058),\n",
       "  ('stem', 0.02564729447517015),\n",
       "  ('strawberry', 0.02542228213288225),\n",
       "  ('apple', 0.023796864419463246),\n",
       "  ('seedling', 0.023435009942144657),\n",
       "  ('vision', 0.021464823437036967),\n",
       "  ('crop', 0.020433543992079268),\n",
       "  ('graft', 0.02035031076609889),\n",
       "  ('grape', 0.020142670703433743),\n",
       "  ('plant', 0.01988589896826524),\n",
       "  ('agricultural', 0.019833487676410078),\n",
       "  ('endeffector', 0.018468364648929488),\n",
       "  ('robotic', 0.018140709219998885),\n",
       "  ('segmentation', 0.01769829406894395),\n",
       "  ('machine', 0.017169733332644894),\n",
       "  ('orchard', 0.016976514929652277),\n",
       "  ('method', 0.016608661807029617),\n",
       "  ('target', 0.016126488644251747),\n",
       "  ('robot', 0.015498021525253796),\n",
       "  ('flower', 0.014980766049234607),\n",
       "  ('vegetable', 0.0148782364468336),\n",
       "  ('branch', 0.014479725442335022),\n",
       "  ('poultry', 0.01404256903699156),\n",
       "  ('cluster', 0.013876805443095067),\n",
       "  ('color', 0.013752772669948551),\n",
       "  ('process', 0.013655504087776006),\n",
       "  ('cherry', 0.013494556403296493),\n",
       "  ('rootstock', 0.013359603704236986),\n",
       "  ('tree', 0.01322941605028945),\n",
       "  ('system', 0.013219192695414057),\n",
       "  ('base', 0.013053605822163016),\n",
       "  ('sort', 0.012895664746741805),\n",
       "  ('food', 0.011791056788596843),\n",
       "  ('design', 0.011228560661725095),\n",
       "  ('peduncle', 0.011200341839532156),\n",
       "  ('develop', 0.011198211715939314),\n",
       "  ('rate', 0.010946250872355326),\n",
       "  ('pineapple', 0.010888729689067978),\n",
       "  ('detection', 0.010810111895374157),\n",
       "  ('harvesting', 0.01073471204484453),\n",
       "  ('processing', 0.010687042731454656),\n",
       "  ('depth', 0.010042865067958321),\n",
       "  ('camera', 0.010036348198353993),\n",
       "  ('bird', 0.009983809896598729),\n",
       "  ('perform', 0.009908649014197727),\n",
       "  ('pig', 0.009893418170778838),\n",
       "  ('algorithm', 0.009800079310287917),\n",
       "  ('study', 0.009743915576194508),\n",
       "  ('determine', 0.009649173714790727),\n",
       "  ('bone', 0.009613209958384645),\n",
       "  ('control', 0.0095324287199846),\n",
       "  ('pedicel', 0.009517350997069742),\n",
       "  ('dragon', 0.00942165165787268),\n",
       "  ('path', 0.009418736254678813),\n",
       "  ('string', 0.009415396552647603),\n",
       "  ('involve', 0.009349195089463446),\n",
       "  ('automate', 0.009300494907108148),\n",
       "  ('seed', 0.008914823957290154),\n",
       "  ('automatic', 0.008881409310169992),\n",
       "  ('position', 0.008817148567169692),\n",
       "  ('arm', 0.008668215535411916),\n",
       "  ('result', 0.008446204426060408),\n",
       "  ('locate', 0.008315113444254035),\n",
       "  ('scion', 0.008292167816422958),\n",
       "  ('scale', 0.008288304380128602),\n",
       "  ('knife', 0.00828527001552639),\n",
       "  ('identify', 0.0082696900015936),\n",
       "  ('lotus', 0.00813323908928896),\n",
       "  ('pasture', 0.007970241056732181),\n",
       "  ('frame', 0.007932789060459083),\n",
       "  ('provide', 0.007884916887961786),\n",
       "  ('model', 0.007862217688353174),\n",
       "  ('pork', 0.007840745657864306),\n",
       "  ('debone', 0.007840745657864306),\n",
       "  ('enable', 0.007754819564743371),\n",
       "  ('improve', 0.007716520866295592),\n",
       "  ('feature', 0.007714071113143768),\n",
       "  ('operation', 0.00768953629870054),\n",
       "  ('field', 0.007681564751158085),\n",
       "  ('cultivation', 0.007676865436566669),\n",
       "  ('mechanism', 0.007574170711669402),\n",
       "  ('damage', 0.007547904428708063),\n",
       "  ('recognition', 0.007524035519022291),\n",
       "  ('classification', 0.007492574272032991),\n",
       "  ('reduce', 0.007479012854880966),\n",
       "  ('realize', 0.007407382755464527),\n",
       "  ('success', 0.007383899260354979),\n",
       "  ('size', 0.007332291056941666),\n",
       "  ('module', 0.007297137099320759),\n",
       "  ('grip', 0.0072844208830411695),\n",
       "  ('harvester', 0.007284205652390414),\n",
       "  ('propose', 0.007251200617724523),\n",
       "  ('force', 0.007204722748924072)],\n",
       " 3: [('mow', 0.16477699018091888),\n",
       "  ('grass', 0.11960878991537545),\n",
       "  ('mower', 0.11138993296104152),\n",
       "  ('lawn', 0.10904268930713588),\n",
       "  ('cut', 0.07758619668530398),\n",
       "  ('boundary', 0.06312121424059937),\n",
       "  ('lawnmower', 0.0442285779398415),\n",
       "  ('obstacle', 0.032826332518604194),\n",
       "  ('robotic', 0.02994349199262305),\n",
       "  ('robot', 0.02709363058198558),\n",
       "  ('signal', 0.026981951174732125),\n",
       "  ('sensor', 0.02238320738003363),\n",
       "  ('garden', 0.021834091546759183),\n",
       "  ('method', 0.02136970681710079),\n",
       "  ('autonomous', 0.01947068419333061),\n",
       "  ('control', 0.01914662647913857),\n",
       "  ('path', 0.01914493676791372),\n",
       "  ('vehicle', 0.019100803098251667),\n",
       "  ('position', 0.018548175638611965),\n",
       "  ('base', 0.018330990637972094),\n",
       "  ('station', 0.017835858598840012),\n",
       "  ('perimeter', 0.017767666805618917),\n",
       "  ('detect', 0.01735771529587613),\n",
       "  ('wire', 0.01705224650789176),\n",
       "  ('turf', 0.016927567330731304),\n",
       "  ('operation', 0.016923642141440636),\n",
       "  ('avoidance', 0.016879018642247813),\n",
       "  ('determine', 0.016210474192991573),\n",
       "  ('claim', 0.01612387545385097),\n",
       "  ('distance', 0.01547727930825832),\n",
       "  ('mowing', 0.014630112101318002),\n",
       "  ('system', 0.014285627410722817),\n",
       "  ('uwb', 0.01416863926596728),\n",
       "  ('draw', 0.014088072482165093),\n",
       "  ('blade', 0.013759836364289364),\n",
       "  ('advantage', 0.013587447990763302),\n",
       "  ('direction', 0.013503665393069342),\n",
       "  ('involve', 0.013436877818163197),\n",
       "  ('accord', 0.013087673876090037),\n",
       "  ('task', 0.012589177573129346),\n",
       "  ('device', 0.01240121758668463),\n",
       "  ('unit', 0.012343858484499192),\n",
       "  ('tool', 0.012331879341644193),\n",
       "  ('set', 0.012302207498543874),\n",
       "  ('independent', 0.012239146713944549),\n",
       "  ('generate', 0.012178411127421122),\n",
       "  ('maintenance', 0.01180790348439379),\n",
       "  ('route', 0.011694358065545772),\n",
       "  ('provide', 0.011574213689164581),\n",
       "  ('operate', 0.011414319996056582),\n",
       "  ('comprise', 0.011303819577788102),\n",
       "  ('coordinate', 0.011160480141119096),\n",
       "  ('perform', 0.011138477949133356),\n",
       "  ('detection', 0.011124283207038762),\n",
       "  ('guide', 0.011036865065962999),\n",
       "  ('current', 0.010988986070408671),\n",
       "  ('avoid', 0.010757173606380076),\n",
       "  ('drive', 0.010682961572543042),\n",
       "  ('height', 0.01066315018992282),\n",
       "  ('travel', 0.010519369516465649),\n",
       "  ('navigation', 0.010466478435851469),\n",
       "  ('improve', 0.010420537589402257),\n",
       "  ('detailed', 0.010330593952402631),\n",
       "  ('motor', 0.010128816437407335),\n",
       "  ('controller', 0.010096497660247844),\n",
       "  ('data', 0.010078948527906549),\n",
       "  ('parcel', 0.009984076721667736),\n",
       "  ('location', 0.009975921109376312),\n",
       "  ('eg', 0.009809640260431924),\n",
       "  ('receive', 0.009807054507122926),\n",
       "  ('step', 0.009644291870620594),\n",
       "  ('view', 0.009611879096431073),\n",
       "  ('map', 0.009522111889045188),\n",
       "  ('preset', 0.00949712026159225),\n",
       "  ('charge', 0.009406165319373175),\n",
       "  ('time', 0.00923149714135341),\n",
       "  ('condition', 0.009174754582345427),\n",
       "  ('grassland', 0.0090302932155399),\n",
       "  ('image', 0.008931110063588979),\n",
       "  ('yard', 0.00887083206988772),\n",
       "  ('coverage', 0.008719797377149117),\n",
       "  ('enable', 0.008550900663455187),\n",
       "  ('circuitry', 0.00842841753296911),\n",
       "  ('configure', 0.008414632087800968),\n",
       "  ('environment', 0.00840614775697308),\n",
       "  ('efficiency', 0.00834995245765794),\n",
       "  ('mobile', 0.008205187627304641),\n",
       "  ('mode', 0.008112588724503505),\n",
       "  ('schematic', 0.008102798858682597),\n",
       "  ('green', 0.008085229442155306),\n",
       "  ('module', 0.007855790795447523),\n",
       "  ('field', 0.007678960186622718),\n",
       "  ('processor', 0.00766512812035454),\n",
       "  ('process', 0.007656740200802821),\n",
       "  ('speed', 0.007623903171452293),\n",
       "  ('reduce', 0.007450516979518444),\n",
       "  ('machine', 0.007387703070058137),\n",
       "  ('virtual', 0.007297078197314893),\n",
       "  ('rain', 0.007088317392042699),\n",
       "  ('reference', 0.007080580486468598)],\n",
       " 4: [('catheter', 0.15143023885513707),\n",
       "  ('ablation', 0.0504764460627682),\n",
       "  ('capsule', 0.04672757276306399),\n",
       "  ('brachytherapy', 0.036942341920455465),\n",
       "  ('robotic', 0.03332455717485878),\n",
       "  ('patient', 0.0315428790990917),\n",
       "  ('model', 0.02796504711301851),\n",
       "  ('vascular', 0.027878254420355776),\n",
       "  ('atrial', 0.026441003736113605),\n",
       "  ('system', 0.022906799694559946),\n",
       "  ('force', 0.022613725772423376),\n",
       "  ('medical', 0.022056966355847866),\n",
       "  ('design', 0.020383885003531613),\n",
       "  ('study', 0.019641369825358024),\n",
       "  ('result', 0.019514607023790095),\n",
       "  ('navigation', 0.019283339315406576),\n",
       "  ('catheterization', 0.01923896350222478),\n",
       "  ('interventional', 0.019203755269733183),\n",
       "  ('procedure', 0.01905462190097257),\n",
       "  ('fibrillation', 0.01877519120382679),\n",
       "  ('tissue', 0.01868653435025008),\n",
       "  ('magnetic', 0.018087379324823915),\n",
       "  ('pressure', 0.017765992378363883),\n",
       "  ('lesion', 0.017207295782990913),\n",
       "  ('cardiac', 0.016688244574836867),\n",
       "  ('pvi', 0.016673736581672607),\n",
       "  ('surgery', 0.016033221295714505),\n",
       "  ('endoscopy', 0.015902907140942217),\n",
       "  ('intervention', 0.01579499703227814),\n",
       "  ('treatment', 0.015424885751554531),\n",
       "  ('intestine', 0.01536501971623677),\n",
       "  ('control', 0.015256404689432242),\n",
       "  ('inside', 0.015101701022006859),\n",
       "  ('vein', 0.015086427137624583),\n",
       "  ('pulse', 0.014930044836920594),\n",
       "  ('experimental', 0.014883249798154157),\n",
       "  ('pulmonary', 0.01469362789864705),\n",
       "  ('endoscopic', 0.014547887759957539),\n",
       "  ('complication', 0.014454128457712366),\n",
       "  ('paper', 0.013992193439550112),\n",
       "  ('develop', 0.013484660105047267),\n",
       "  ('feedback', 0.013409224138358107),\n",
       "  ('artery', 0.013400830437400358),\n",
       "  ('needle', 0.013381440536590366),\n",
       "  ('propose', 0.013334497962303982),\n",
       "  ('manipulator', 0.01325226080781111),\n",
       "  ('device', 0.013218446293741986),\n",
       "  ('guide', 0.012754435406797564),\n",
       "  ('parallel', 0.012606178628129575),\n",
       "  ('surgeon', 0.012474617164478584),\n",
       "  ('master', 0.012448653953373759),\n",
       "  ('hysteresis', 0.012374874173555784),\n",
       "  ('approach', 0.012192279128641069),\n",
       "  ('persistent', 0.0121719513873072),\n",
       "  ('heart', 0.012114388252253385),\n",
       "  ('conduit', 0.012102646798613581),\n",
       "  ('vessel', 0.011841759353716749),\n",
       "  ('simulation', 0.011702572518978722),\n",
       "  ('wire', 0.011480468234032797),\n",
       "  ('invasive', 0.011424136263142575),\n",
       "  ('innovative', 0.011404564130210787),\n",
       "  ('tonometry', 0.011371616802709697),\n",
       "  ('isolation', 0.01119183067524656),\n",
       "  ('clinical', 0.011103849838968406),\n",
       "  ('cancer', 0.011092192436970325),\n",
       "  ('sensor', 0.011032350458163523),\n",
       "  ('locomotion', 0.010988074181428139),\n",
       "  ('test', 0.010849363788592806),\n",
       "  ('mri', 0.010740387420656508),\n",
       "  ('robot', 0.010731141535160256),\n",
       "  ('minimally', 0.010519229737668676),\n",
       "  ('soft', 0.010442676648839404),\n",
       "  ('accuracy', 0.01029958379159652),\n",
       "  ('friction', 0.010107055064671158),\n",
       "  ('dress', 0.010010649022337649),\n",
       "  ('structure', 0.009789485996219056),\n",
       "  ('endovascular', 0.009704222978675854),\n",
       "  ('endoscope', 0.009634427931092213),\n",
       "  ('proximal', 0.009410014326419223),\n",
       "  ('actuation', 0.009396046468425467),\n",
       "  ('resistance', 0.009381412908154384),\n",
       "  ('motion', 0.009365061506491839),\n",
       "  ('achieve', 0.009196784958113392),\n",
       "  ('intestinal', 0.009119410972539236),\n",
       "  ('colon', 0.009119410972539236),\n",
       "  ('localization', 0.009100467416264935),\n",
       "  ('success', 0.009063228458558647),\n",
       "  ('embolization', 0.008997436068233682),\n",
       "  ('xray', 0.008975551985400336),\n",
       "  ('surgical', 0.008844912538012029),\n",
       "  ('safety', 0.008750679595168249),\n",
       "  ('kinematic', 0.008729068764163307),\n",
       "  ('mechanism', 0.008650473810255823),\n",
       "  ('delivery', 0.008552068128622244),\n",
       "  ('rate', 0.008516310418095864),\n",
       "  ('perform', 0.008481637250656017),\n",
       "  ('provide', 0.008480688507896322),\n",
       "  ('fluid', 0.00835622529180846),\n",
       "  ('followup', 0.008336581992278628),\n",
       "  ('insertion', 0.008324855174725306)],\n",
       " 5: [('pipe', 0.18976739550900676),\n",
       "  ('pipeline', 0.13975839833486536),\n",
       "  ('pipette', 0.055627237525260186),\n",
       "  ('inspection', 0.03542920408591114),\n",
       "  ('robot', 0.03137183314243455),\n",
       "  ('inpipe', 0.025817011326838203),\n",
       "  ('bend', 0.024496956830458726),\n",
       "  ('method', 0.020992487555701274),\n",
       "  ('cut', 0.020435444900811825),\n",
       "  ('diameter', 0.020432090880793858),\n",
       "  ('position', 0.020408179936099953),\n",
       "  ('mechanism', 0.018452937118471912),\n",
       "  ('wall', 0.018012675249871175),\n",
       "  ('water', 0.017283341721714647),\n",
       "  ('process', 0.016502069255548302),\n",
       "  ('detection', 0.016453731237866434),\n",
       "  ('system', 0.015466164374046765),\n",
       "  ('measure', 0.014099679357876089),\n",
       "  ('involve', 0.013439553742115869),\n",
       "  ('drive', 0.013365490758926301),\n",
       "  ('gallery', 0.013100016587612505),\n",
       "  ('design', 0.013094103474386875),\n",
       "  ('culvert', 0.012956325367557737),\n",
       "  ('sensor', 0.012619620325098859),\n",
       "  ('assembly', 0.012460550734014043),\n",
       "  ('control', 0.012357127951132658),\n",
       "  ('gas', 0.012247761873582645),\n",
       "  ('move', 0.012234280040677586),\n",
       "  ('determine', 0.011676928581078194),\n",
       "  ('sample', 0.01132130679052976),\n",
       "  ('detect', 0.011277997736753007),\n",
       "  ('wheel', 0.01117235492023824),\n",
       "  ('joint', 0.01085700453250883),\n",
       "  ('power', 0.01072174526539473),\n",
       "  ('front', 0.010598663257717232),\n",
       "  ('advantage', 0.010458619365300558),\n",
       "  ('perform', 0.010370251905058548),\n",
       "  ('ring', 0.01028644093193457),\n",
       "  ('sewer', 0.010259998224323595),\n",
       "  ('repair', 0.010201260192250426),\n",
       "  ('underground', 0.010032356610970477),\n",
       "  ('metal', 0.010015222260792545),\n",
       "  ('measurement', 0.009787678461586718),\n",
       "  ('locate', 0.009779769725709781),\n",
       "  ('draw', 0.00975399328136116),\n",
       "  ('monitor', 0.009690190507638093),\n",
       "  ('operation', 0.00962748493469411),\n",
       "  ('form', 0.009542020575910234),\n",
       "  ('fluid', 0.009469666615508566),\n",
       "  ('press', 0.009352979628754551),\n",
       "  ('manipulator', 0.009208949786071802),\n",
       "  ('deck', 0.00905852190880682),\n",
       "  ('model', 0.008986372677567517),\n",
       "  ('speed', 0.008983929772349096),\n",
       "  ('device', 0.0089718370308537),\n",
       "  ('tube', 0.008935416340821093),\n",
       "  ('node', 0.008927519837683813),\n",
       "  ('camera', 0.008846656257649679),\n",
       "  ('scan', 0.008838624322076587),\n",
       "  ('realize', 0.008822778287047578),\n",
       "  ('maintenance', 0.008636470191109616),\n",
       "  ('result', 0.008585772437594017),\n",
       "  ('defect', 0.008572888393865611),\n",
       "  ('base', 0.008534372577463527),\n",
       "  ('component', 0.008345247108312945),\n",
       "  ('scraper', 0.008151452241859043),\n",
       "  ('track', 0.008148424355308567),\n",
       "  ('coordinate', 0.007948925915793985),\n",
       "  ('flexible', 0.007937107037611751),\n",
       "  ('paper', 0.0077489316754043094),\n",
       "  ('unit', 0.007728077687636189),\n",
       "  ('inspect', 0.007707292444033894),\n",
       "  ('elbow', 0.007698337211420343),\n",
       "  ('ultrasonic', 0.0074403752558457594),\n",
       "  ('connect', 0.007327944434261469),\n",
       "  ('processing', 0.007305560562254588),\n",
       "  ('branch', 0.007298674436970612),\n",
       "  ('enable', 0.0072966268100673306),\n",
       "  ('error', 0.007214400967806577),\n",
       "  ('linear', 0.007132089079184811),\n",
       "  ('sewage', 0.007094291476172542),\n",
       "  ('fill', 0.007077423660562192),\n",
       "  ('accord', 0.007056027354951829),\n",
       "  ('angle', 0.0070101181661132534),\n",
       "  ('infrasonic', 0.0069713659829831465),\n",
       "  ('direction', 0.0069137423637033145),\n",
       "  ('brush', 0.006906563296747125),\n",
       "  ('initial', 0.006894758862378399),\n",
       "  ('propose', 0.0068376827197010005),\n",
       "  ('clean', 0.006813311930978821),\n",
       "  ('image', 0.006777688351916252),\n",
       "  ('data', 0.006770918598657988),\n",
       "  ('travel', 0.0067582590025050075),\n",
       "  ('nonenglish', 0.00674658809485519),\n",
       "  ('navigation', 0.006634621625962734),\n",
       "  ('movement', 0.006592171848938568),\n",
       "  ('pressure', 0.006590938100916021),\n",
       "  ('squeegee', 0.006587844853251482),\n",
       "  ('language', 0.006498219148649496),\n",
       "  ('handle', 0.006458579581146)],\n",
       " 6: [('sample', 0.08134474012933869),\n",
       "  ('cell', 0.07105560869667997),\n",
       "  ('blood', 0.06964825422621737),\n",
       "  ('dna', 0.062220367530625285),\n",
       "  ('protein', 0.05543119719080238),\n",
       "  ('liquid', 0.04710711229074869),\n",
       "  ('automate', 0.04022582383614525),\n",
       "  ('highthroughput', 0.038810890520392494),\n",
       "  ('handle', 0.029905799418257457),\n",
       "  ('assay', 0.0282081582508128),\n",
       "  ('molecular', 0.02613794667699903),\n",
       "  ('culture', 0.025577910772130147),\n",
       "  ('protocol', 0.022569439596099868),\n",
       "  ('screen', 0.021244277263006817),\n",
       "  ('extraction', 0.019976831804565658),\n",
       "  ('cap', 0.018765906980723206),\n",
       "  ('throughput', 0.018744821317393967),\n",
       "  ('laboratory', 0.018498224015157272),\n",
       "  ('tube', 0.01816443284659167),\n",
       "  ('preparation', 0.01791034407966688),\n",
       "  ('robotic', 0.01769126657679802),\n",
       "  ('automation', 0.01760506702141731),\n",
       "  ('process', 0.01743095382926694),\n",
       "  ('vessel', 0.01711699926144467),\n",
       "  ('biological', 0.016844715548753057),\n",
       "  ('conformational', 0.016464451642663788),\n",
       "  ('yeast', 0.01636390742448677),\n",
       "  ('method', 0.01630497403849239),\n",
       "  ('liquidhandling', 0.016091285661288743),\n",
       "  ('ethanol', 0.01592948376860972),\n",
       "  ('acid', 0.015167274670954424),\n",
       "  ('biology', 0.015082665275264138),\n",
       "  ('scnt', 0.01482976478679337),\n",
       "  ('analysis', 0.014682457574694245),\n",
       "  ('somatic', 0.014635068126812258),\n",
       "  ('tissue', 0.014394003210962038),\n",
       "  ('gene', 0.014354077175334233),\n",
       "  ('development', 0.014260950202005492),\n",
       "  ('require', 0.013908986789895314),\n",
       "  ('reaction', 0.013537566722445429),\n",
       "  ('formulation', 0.013496234323324731),\n",
       "  ('system', 0.013441959917910912),\n",
       "  ('reagent', 0.012981323884961234),\n",
       "  ('develop', 0.012836047403458721),\n",
       "  ('stem', 0.012714369010195375),\n",
       "  ('plate', 0.012687496238591556),\n",
       "  ('assembly', 0.01266526529969995),\n",
       "  ('manual', 0.012558376404850073),\n",
       "  ('test', 0.012415323256230619),\n",
       "  ('lipase', 0.012328064010542482),\n",
       "  ('synthetic', 0.011736069748909107),\n",
       "  ('microfluidic', 0.011387181579146253),\n",
       "  ('clone', 0.011076959381277167),\n",
       "  ('nucleic', 0.01104716342263104),\n",
       "  ('demonstrate', 0.010925666279300918),\n",
       "  ('transfer', 0.010828283818216388),\n",
       "  ('bead', 0.010761338806397876),\n",
       "  ('volume', 0.010754726629055918),\n",
       "  ('prepare', 0.01055354466141008),\n",
       "  ('pcr', 0.01026880864300709),\n",
       "  ('incubation', 0.01019546329092044),\n",
       "  ('strain', 0.010191434721209047),\n",
       "  ('clinical', 0.010137074211544927),\n",
       "  ('approach', 0.010087230903278626),\n",
       "  ('antibody', 0.010061609337183426),\n",
       "  ('reproducibility', 0.009925951239332605),\n",
       "  ('complex', 0.009858471842713622),\n",
       "  ('workflow', 0.009774275506852418),\n",
       "  ('preanalytical', 0.00975419500185036),\n",
       "  ('expression', 0.009684584476948942),\n",
       "  ('centrifugation', 0.009655721936476656),\n",
       "  ('enzyme', 0.009483126161955756),\n",
       "  ('genome', 0.009483126161955756),\n",
       "  ('nuclear', 0.009426443600739697),\n",
       "  ('perform', 0.00941928184472473),\n",
       "  ('study', 0.009339198154598074),\n",
       "  ('transition', 0.009247755113758003),\n",
       "  ('swab', 0.0091261688458512),\n",
       "  ('chamber', 0.009049707825190333),\n",
       "  ('plasma', 0.008985047279354246),\n",
       "  ('detection', 0.00895931240517293),\n",
       "  ('experiment', 0.00889768350431558),\n",
       "  ('casework', 0.008876747512011587),\n",
       "  ('design', 0.008789111963164908),\n",
       "  ('spectrometry', 0.008778775501665325),\n",
       "  ('enable', 0.008740878766683152),\n",
       "  ('provide', 0.008683207762292599),\n",
       "  ('solubility', 0.008609241407506176),\n",
       "  ('collect', 0.008601006529646958),\n",
       "  ('increase', 0.008577485622481042),\n",
       "  ('time', 0.008569030412928471),\n",
       "  ('snp', 0.00853481354576018),\n",
       "  ('platform', 0.008501567121213806),\n",
       "  ('purification', 0.00840175252609671),\n",
       "  ('rna', 0.00834174269257127),\n",
       "  ('pipetting', 0.00834174269257127),\n",
       "  ('rapid', 0.00823714631118673),\n",
       "  ('needle', 0.008059405875290242),\n",
       "  ('injection', 0.008040401254702845),\n",
       "  ('technology', 0.007990128350739938)],\n",
       " 7: [('print', 0.1682271278956582),\n",
       "  ('printing', 0.10456522812932956),\n",
       "  ('additive', 0.049450462265991826),\n",
       "  ('manufacturing', 0.039405703815607776),\n",
       "  ('printer', 0.038642006272061005),\n",
       "  ('material', 0.029608889381731316),\n",
       "  ('stamp', 0.029181141211541993),\n",
       "  ('deposition', 0.028734578288264295),\n",
       "  ('layer', 0.02460642934054687),\n",
       "  ('process', 0.023625696037046603),\n",
       "  ('design', 0.02244241803717555),\n",
       "  ('surface', 0.022201865181851913),\n",
       "  ('fuse', 0.021479875306858586),\n",
       "  ('dry', 0.01934938717341547),\n",
       "  ('threedimensional', 0.019264086239520754),\n",
       "  ('paper', 0.018810293875291793),\n",
       "  ('technology', 0.01850838481352497),\n",
       "  ('extruder', 0.017842726768033335),\n",
       "  ('control', 0.017725943978759207),\n",
       "  ('model', 0.017588111574265472),\n",
       "  ('robotic', 0.01748553873476373),\n",
       "  ('construction', 0.01735592651100095),\n",
       "  ('impeller', 0.016775712344396905),\n",
       "  ('method', 0.016509681810475973),\n",
       "  ('slice', 0.016343217189152968),\n",
       "  ('robot', 0.01622945137248619),\n",
       "  ('concrete', 0.0155341131181589),\n",
       "  ('dimensional', 0.01529841727911478),\n",
       "  ('nozzle', 0.014762472041622916),\n",
       "  ('fourfooted', 0.01435733625735553),\n",
       "  ('system', 0.014304384369825495),\n",
       "  ('mechanism', 0.014267397881742718),\n",
       "  ('processing', 0.01400054534402852),\n",
       "  ('fiber', 0.013714065821802105),\n",
       "  ('build', 0.01326661735149871),\n",
       "  ('laser', 0.013140050692442755),\n",
       "  ('document', 0.012887662692256309),\n",
       "  ('arm', 0.012846645255797127),\n",
       "  ('manufacture', 0.012843760071717837),\n",
       "  ('carbon', 0.012835968362197608),\n",
       "  ('film', 0.012454678417188893),\n",
       "  ('magnetic', 0.012381027858114416),\n",
       "  ('structure', 0.012359112481629462),\n",
       "  ('mechanical', 0.012311840911796462),\n",
       "  ('unit', 0.012218470227148585),\n",
       "  ('printhead', 0.011901426942404097),\n",
       "  ('transfer', 0.01188940872609427),\n",
       "  ('path', 0.011724010683307898),\n",
       "  ('fabrication', 0.011545210857829271),\n",
       "  ('industrial', 0.011067425964328132),\n",
       "  ('fdm', 0.010814373932002564),\n",
       "  ('form', 0.01056556168814405),\n",
       "  ('sheet', 0.01056158127005999),\n",
       "  ('conformal', 0.010293170826386817),\n",
       "  ('curve', 0.010287982667224952),\n",
       "  ('continuous', 0.010162400064606785),\n",
       "  ('device', 0.010070675449536114),\n",
       "  ('extrude', 0.010043617393605106),\n",
       "  ('fill', 0.01001600381947763),\n",
       "  ('extrusion', 0.009655129178935535),\n",
       "  ('involve', 0.009633365052315882),\n",
       "  ('substrate', 0.009576102444384577),\n",
       "  ('hand', 0.00945453332538555),\n",
       "  ('resin', 0.009389594794631176),\n",
       "  ('perform', 0.00938719478625727),\n",
       "  ('development', 0.009218834503131611),\n",
       "  ('manipulator', 0.009111419256212925),\n",
       "  ('cut', 0.009007480701838256),\n",
       "  ('production', 0.00896254520540763),\n",
       "  ('ink', 0.0089023656318766),\n",
       "  ('robotics', 0.00887428378098077),\n",
       "  ('base', 0.008869696720523108),\n",
       "  ('fabric', 0.008803886274242272),\n",
       "  ('pattern', 0.008770392134628987),\n",
       "  ('flexible', 0.008711671858608591),\n",
       "  ('shape', 0.00871026408935073),\n",
       "  ('enable', 0.008689699507340476),\n",
       "  ('fabricate', 0.008673863215669002),\n",
       "  ('advantage', 0.008488859382937662),\n",
       "  ('object', 0.008478313061063789),\n",
       "  ('complex', 0.008364432246678766),\n",
       "  ('building', 0.008231708062340947),\n",
       "  ('machine', 0.008148016772771032),\n",
       "  ('temperature', 0.008103539312357157),\n",
       "  ('nozzlebeddistance', 0.008016052270555839),\n",
       "  ('nanoparticle', 0.008016052270555839),\n",
       "  ('fff', 0.008016052270555839),\n",
       "  ('tio2', 0.007906798720924542),\n",
       "  ('technique', 0.00774903965567461),\n",
       "  ('automatic', 0.007622467643825502),\n",
       "  ('soft', 0.007589380325103225),\n",
       "  ('beam', 0.0075083190070830835),\n",
       "  ('quality', 0.007400171106451699),\n",
       "  ('realize', 0.007346311171943923),\n",
       "  ('particle', 0.007340999995952323),\n",
       "  ('head', 0.007284398184153361),\n",
       "  ('support', 0.0072476886221312905),\n",
       "  ('drive', 0.007171902031318185),\n",
       "  ('thigh', 0.007168249591838807),\n",
       "  ('tool', 0.0071647509723978845)],\n",
       " 8: [('fire', 0.26231209958927554),\n",
       "  ('firefighting', 0.11455195704137205),\n",
       "  ('extinguish', 0.11289327472004772),\n",
       "  ('flame', 0.07131136398004492),\n",
       "  ('water', 0.033053895281447365),\n",
       "  ('temperature', 0.032700839064724284),\n",
       "  ('smoke', 0.0322675579478764),\n",
       "  ('fight', 0.031569123897988716),\n",
       "  ('robot', 0.031026128397871576),\n",
       "  ('sensor', 0.025915087763063595),\n",
       "  ('unit', 0.023252326495069305),\n",
       "  ('door', 0.02262838794326323),\n",
       "  ('fireproof', 0.022285386758831315),\n",
       "  ('detection', 0.021472555832577078),\n",
       "  ('control', 0.021147023959273422),\n",
       "  ('alarm', 0.01966019856808694),\n",
       "  ('infrared', 0.019525682458526195),\n",
       "  ('spray', 0.019310058033317146),\n",
       "  ('monitor', 0.01920311794894395),\n",
       "  ('detect', 0.018188204190569036),\n",
       "  ('firefighter', 0.01734430597948894),\n",
       "  ('method', 0.016425965263559644),\n",
       "  ('reconnaissance', 0.016381929115906215),\n",
       "  ('image', 0.015030826237017934),\n",
       "  ('life', 0.014664843650329933),\n",
       "  ('pipe', 0.014603527444194951),\n",
       "  ('injection', 0.014419896172054508),\n",
       "  ('rescue', 0.014153284591607036),\n",
       "  ('module', 0.014140635729611039),\n",
       "  ('device', 0.014124522039906074),\n",
       "  ('fireextinguishing', 0.01395609707150144),\n",
       "  ('system', 0.013780856788722649),\n",
       "  ('emergency', 0.01376757812237835),\n",
       "  ('perform', 0.013565447871018741),\n",
       "  ('adjust', 0.013303907484579951),\n",
       "  ('multisensor', 0.013037526631653036),\n",
       "  ('thermal', 0.01300058962228897),\n",
       "  ('advantage', 0.012845906607493815),\n",
       "  ('draw', 0.01282351055384234),\n",
       "  ('angle', 0.012728195069739635),\n",
       "  ('corridor', 0.012033646380521061),\n",
       "  ('cannon', 0.012008944205454567),\n",
       "  ('realize', 0.011999222431397848),\n",
       "  ('provide', 0.011950192403101339),\n",
       "  ('processing', 0.011927246556316119),\n",
       "  ('monitoring', 0.011419929681067214),\n",
       "  ('rocker', 0.011283120274042649),\n",
       "  ('data', 0.011278149099782059),\n",
       "  ('safety', 0.011278023082805778),\n",
       "  ('building', 0.011270409257018273),\n",
       "  ('heat', 0.0111654101112988),\n",
       "  ('repeater', 0.011165135045356817),\n",
       "  ('involve', 0.011135856651043954),\n",
       "  ('autonomous', 0.011078926455996747),\n",
       "  ('protection', 0.010833853137641621),\n",
       "  ('extinguisher', 0.0108228413909679),\n",
       "  ('operation', 0.010636294845303904),\n",
       "  ('location', 0.01047942278800993),\n",
       "  ('accord', 0.01041747400588825),\n",
       "  ('medium', 0.010094035182211986),\n",
       "  ('send', 0.009935811889474538),\n",
       "  ('leave', 0.009913614874541626),\n",
       "  ('sense', 0.009838400287318309),\n",
       "  ('environment', 0.009776536770521404),\n",
       "  ('source', 0.009723969951993162),\n",
       "  ('realtime', 0.009643482882265143),\n",
       "  ('condition', 0.009637820025888331),\n",
       "  ('communication', 0.009624249417539088),\n",
       "  ('highrise', 0.00952755166385764),\n",
       "  ('signal', 0.009463464707224487),\n",
       "  ('collect', 0.009438559188353056),\n",
       "  ('vision', 0.009127988965587924),\n",
       "  ('enable', 0.009068849132071134),\n",
       "  ('reduce', 0.009019629970749688),\n",
       "  ('view', 0.009015184782577495),\n",
       "  ('connect', 0.008886978753195175),\n",
       "  ('slope', 0.00880069176250489),\n",
       "  ('valve', 0.008772616176313273),\n",
       "  ('inspection', 0.00865236049138798),\n",
       "  ('gas', 0.008524615581398524),\n",
       "  ('firework', 0.008523287311065405),\n",
       "  ('disaster', 0.008483561012861917),\n",
       "  ('air', 0.00830253242973153),\n",
       "  ('rail', 0.008292670075045808),\n",
       "  ('instruction', 0.008283955741561476),\n",
       "  ('camera', 0.008276072505182962),\n",
       "  ('accident', 0.008255761216567308),\n",
       "  ('front', 0.0081964662316167),\n",
       "  ('inside', 0.008096743760210879),\n",
       "  ('process', 0.008069999510351497),\n",
       "  ('base', 0.007996213189108686),\n",
       "  ('chassis', 0.00794887745180856),\n",
       "  ('stereo', 0.007942747269864025),\n",
       "  ('diagram', 0.007926563501793132),\n",
       "  ('escape', 0.007881074293950414),\n",
       "  ('abnormal', 0.007866104444044784),\n",
       "  ('nonenglish', 0.007826201307675768),\n",
       "  ('smart', 0.007707688236667579),\n",
       "  ('danger', 0.00768041516406484),\n",
       "  ('text', 0.00761544677708972)],\n",
       " 9: [('student', 0.157203221377913),\n",
       "  ('education', 0.08382522352003728),\n",
       "  ('robotics', 0.08358483908694711),\n",
       "  ('educational', 0.0761656082554005),\n",
       "  ('engineering', 0.0656061062740463),\n",
       "  ('project', 0.05262212018770349),\n",
       "  ('learn', 0.050211518345799885),\n",
       "  ('science', 0.04402152791452415),\n",
       "  ('lego', 0.03635715615108524),\n",
       "  ('teach', 0.0301533565719598),\n",
       "  ('undergraduate', 0.02873126953230616),\n",
       "  ('design', 0.02871478537285898),\n",
       "  ('laboratory', 0.027775815207578432),\n",
       "  ('technology', 0.02702732127356577),\n",
       "  ('paper', 0.0252702659064832),\n",
       "  ('stem', 0.02434698521580349),\n",
       "  ('curriculum', 0.023451616509107404),\n",
       "  ('development', 0.023295875964479063),\n",
       "  ('develop', 0.02285678914804332),\n",
       "  ('industrial', 0.022223128926939582),\n",
       "  ('activity', 0.021559740599293154),\n",
       "  ('concept', 0.020490247603158776),\n",
       "  ('program', 0.020156328899775703),\n",
       "  ('school', 0.018969285074158192),\n",
       "  ('university', 0.018864141856014274),\n",
       "  ('handson', 0.018399038538322574),\n",
       "  ('robot', 0.018380555487251298),\n",
       "  ('pedagogical', 0.01807294387664672),\n",
       "  ('projectbased', 0.01779117974346986),\n",
       "  ('mindstorms', 0.017544738686693748),\n",
       "  ('study', 0.016827810621161506),\n",
       "  ('mathematics', 0.016361908622763287),\n",
       "  ('knowledge', 0.01627173448589531),\n",
       "  ('approach', 0.016271306087954643),\n",
       "  ('application', 0.016106841617936168),\n",
       "  ('system', 0.015394297594276643),\n",
       "  ('software', 0.015140421302528259),\n",
       "  ('build', 0.014847712119580253),\n",
       "  ('manufacture', 0.014752734615137769),\n",
       "  ('virtual', 0.0144519787047961),\n",
       "  ('practice', 0.014418642936384639),\n",
       "  ('learning', 0.014387364786740004),\n",
       "  ('manipulator', 0.01433134615497363),\n",
       "  ('experience', 0.014161243734449406),\n",
       "  ('public', 0.014073229369537803),\n",
       "  ('mobile', 0.014019451316562405),\n",
       "  ('thinking', 0.014014382373383703),\n",
       "  ('support', 0.013874860401524613),\n",
       "  ('robotic', 0.013873577460570228),\n",
       "  ('reality', 0.013869323658970015),\n",
       "  ('skill', 0.013817700523965797),\n",
       "  ('hardware', 0.013496549253726335),\n",
       "  ('lab', 0.012967276972457689),\n",
       "  ('embed', 0.012600914411989388),\n",
       "  ('team', 0.012588034885989516),\n",
       "  ('aim', 0.011864511369492218),\n",
       "  ('department', 0.01182043147301755),\n",
       "  ('automation', 0.011784702245734892),\n",
       "  ('graduate', 0.011500964285138821),\n",
       "  ('result', 0.011454263834452518),\n",
       "  ('apply', 0.011365400957166254),\n",
       "  ('class', 0.011144405513170344),\n",
       "  ('professional', 0.011128895631959965),\n",
       "  ('experiment', 0.01072392546020532),\n",
       "  ('lowcost', 0.010628564575492038),\n",
       "  ('provide', 0.010619332118969831),\n",
       "  ('industry', 0.010567944863422083),\n",
       "  ('task', 0.010494259422472712),\n",
       "  ('tool', 0.010474101942731356),\n",
       "  ('algebra', 0.010342367195425172),\n",
       "  ('increase', 0.010338007236024412),\n",
       "  ('scrap', 0.010099725877222698),\n",
       "  ('parametric', 0.010052476779870314),\n",
       "  ('motivate', 0.010010665048028024),\n",
       "  ('basic', 0.009900718466563093),\n",
       "  ('rosi', 0.009857969387261847),\n",
       "  ('kit', 0.009836675743316462),\n",
       "  ('engineer', 0.009711287934928595),\n",
       "  ('control', 0.009695504752844166),\n",
       "  ('computational', 0.009638715661502935),\n",
       "  ('institute', 0.0095438268146246),\n",
       "  ('survey', 0.009506595910846584),\n",
       "  ('technical', 0.009494219469025547),\n",
       "  ('participant', 0.009350721246082322),\n",
       "  ('classroom', 0.009342921582255801),\n",
       "  ('exponential', 0.009339268321902117),\n",
       "  ('offer', 0.009307750942663727),\n",
       "  ('opportunity', 0.009256298810149808),\n",
       "  ('augment', 0.009219836219342711),\n",
       "  ('addition', 0.009115741793033422),\n",
       "  ('model', 0.009091008664477512),\n",
       "  ('remotemanipulation', 0.009070190983463188),\n",
       "  ('computer', 0.009061295969229102),\n",
       "  ('gear', 0.009028730409544753),\n",
       "  ('level', 0.00893651488589354),\n",
       "  ('psychomotor', 0.00890700300517595),\n",
       "  ('academic', 0.008764105996060654),\n",
       "  ('advance', 0.00873093440361176),\n",
       "  ('sensor', 0.008709120651536967),\n",
       "  ('propose', 0.00866968226599769)],\n",
       " 10: [('weed', 0.11839597176420981),\n",
       "  ('spray', 0.11534292614001408),\n",
       "  ('crop', 0.11439219251788646),\n",
       "  ('pesticide', 0.08710128618460475),\n",
       "  ('plant', 0.04241003274393318),\n",
       "  ('agricultural', 0.038375434620699374),\n",
       "  ('greenhouse', 0.03277615872755257),\n",
       "  ('row', 0.03192533124713849),\n",
       "  ('disease', 0.030887055504736253),\n",
       "  ('sprayer', 0.030711729377916244),\n",
       "  ('pest', 0.029019484653823712),\n",
       "  ('image', 0.028752855062014908),\n",
       "  ('herbicide', 0.02871337014310546),\n",
       "  ('flower', 0.025904602445063114),\n",
       "  ('nectar', 0.02565115017813915),\n",
       "  ('insect', 0.025609613988926073),\n",
       "  ('system', 0.0221463622293842),\n",
       "  ('chemical', 0.022048976131775366),\n",
       "  ('agriculture', 0.021698500329682104),\n",
       "  ('robot', 0.020443743439646753),\n",
       "  ('application', 0.018724831899644422),\n",
       "  ('spraying', 0.018677572979284882),\n",
       "  ('control', 0.018353031323350606),\n",
       "  ('seed', 0.017824092489093727),\n",
       "  ('field', 0.01706482511495664),\n",
       "  ('pollination', 0.017056341001527326),\n",
       "  ('result', 0.015761335757938855),\n",
       "  ('vision', 0.015605916618585807),\n",
       "  ('variable', 0.0152726670818861),\n",
       "  ('intelligent', 0.014904146132634456),\n",
       "  ('decisionmaking', 0.014626451597368112),\n",
       "  ('moth', 0.014278043279363814),\n",
       "  ('identification', 0.014252714823694933),\n",
       "  ('larva', 0.013814116838047029),\n",
       "  ('autonomous', 0.013775556649098594),\n",
       "  ('experiment', 0.013724305265007999),\n",
       "  ('reduce', 0.013707251281712787),\n",
       "  ('treatment', 0.013662668287571728),\n",
       "  ('farm', 0.013625757885002393),\n",
       "  ('grapevine', 0.013574493050153924),\n",
       "  ('precision', 0.013546732523654988),\n",
       "  ('method', 0.012711486684282894),\n",
       "  ('mobile', 0.012631073395857678),\n",
       "  ('pollen', 0.012596651381414683),\n",
       "  ('vehicle', 0.01254068965879987),\n",
       "  ('selective', 0.012249193930555131),\n",
       "  ('sow', 0.012091451939093214),\n",
       "  ('rate', 0.011910574367723515),\n",
       "  ('apply', 0.011894786446520087),\n",
       "  ('rice', 0.011846574502861112),\n",
       "  ('ridge', 0.011846574502861112),\n",
       "  ('fuzzy', 0.011830707150764723),\n",
       "  ('target', 0.011379856867216962),\n",
       "  ('harrisia', 0.01133517604650347),\n",
       "  ('collect', 0.011266484258144362),\n",
       "  ('tree', 0.011221461560065232),\n",
       "  ('accuracy', 0.01104351889386344),\n",
       "  ('navigation', 0.011005057019763159),\n",
       "  ('leaf', 0.010807131572066128),\n",
       "  ('curtain', 0.010767513803664547),\n",
       "  ('canopy', 0.010767513803664547),\n",
       "  ('machine', 0.010665248015971875),\n",
       "  ('white', 0.01047074030878607),\n",
       "  ('development', 0.01040768566816156),\n",
       "  ('vineyard', 0.010320618837027236),\n",
       "  ('base', 0.010179231871514422),\n",
       "  ('fly', 0.009949616868579779),\n",
       "  ('robotic', 0.009777735581755357),\n",
       "  ('reclamation', 0.009591444843233836),\n",
       "  ('screen', 0.009558785135426434),\n",
       "  ('design', 0.009265130561655885),\n",
       "  ('coverage', 0.009135276969917849),\n",
       "  ('unit', 0.009056765971156558),\n",
       "  ('processing', 0.008976270135606946),\n",
       "  ('precise', 0.008939227437904953),\n",
       "  ('cost', 0.008927734115857186),\n",
       "  ('farmer', 0.008880093177009345),\n",
       "  ('nozzle', 0.008856447988505193),\n",
       "  ('detect', 0.008728691088626226),\n",
       "  ('orchard', 0.008620304927691889),\n",
       "  ('network', 0.008615731309646688),\n",
       "  ('develop', 0.00860159471774784),\n",
       "  ('operation', 0.008596372021600459),\n",
       "  ('perform', 0.008592776364047061),\n",
       "  ('data', 0.00851412847834406),\n",
       "  ('frame', 0.008459005155906545),\n",
       "  ('sensor', 0.008363186523523646),\n",
       "  ('medicine', 0.008294823338238699),\n",
       "  ('propose', 0.00828450430022096),\n",
       "  ('camera', 0.008232386491959122),\n",
       "  ('smart', 0.008214645527474787),\n",
       "  ('solution', 0.008178297982453812),\n",
       "  ('achieve', 0.008162587506811899),\n",
       "  ('pollinate', 0.008144695830092355),\n",
       "  ('carry', 0.008020531285662305),\n",
       "  ('accord', 0.008018589124487645),\n",
       "  ('remote', 0.00801321383677229),\n",
       "  ('test', 0.007881785283433397),\n",
       "  ('bat', 0.007740464127770427),\n",
       "  ('growth', 0.00771088490450229)],\n",
       " 11: [('emotion', 0.25785540834504606),\n",
       "  ('emotional', 0.13512016959100825),\n",
       "  ('expression', 0.11033815591144433),\n",
       "  ('user', 0.06788788361456254),\n",
       "  ('facial', 0.062236258916942455),\n",
       "  ('interaction', 0.04161329192773424),\n",
       "  ('feel', 0.04010277702380129),\n",
       "  ('intelligent', 0.034462206009346324),\n",
       "  ('mood', 0.0341331325151361),\n",
       "  ('humancomputer', 0.0325438105301327),\n",
       "  ('robot', 0.032041549488721684),\n",
       "  ('feeling', 0.028174458925979824),\n",
       "  ('response', 0.02720165475142648),\n",
       "  ('data', 0.025766609015412768),\n",
       "  ('method', 0.02476872080398582),\n",
       "  ('recognition', 0.022579188807825317),\n",
       "  ('artificial', 0.02247865628377232),\n",
       "  ('express', 0.022416532905238058),\n",
       "  ('model', 0.021681022264818606),\n",
       "  ('display', 0.0211204213545564),\n",
       "  ('process', 0.02050388234675697),\n",
       "  ('animate', 0.02013666023749419),\n",
       "  ('eye', 0.02012269362649703),\n",
       "  ('language', 0.019588588306802063),\n",
       "  ('parameter', 0.019563640004053195),\n",
       "  ('base', 0.01915801769894379),\n",
       "  ('human', 0.017993165559381283),\n",
       "  ('involve', 0.01775449129575742),\n",
       "  ('comfort', 0.017730636507687365),\n",
       "  ('correspond', 0.017371233926355072),\n",
       "  ('customer', 0.01728149320173516),\n",
       "  ('companion', 0.016917471438714873),\n",
       "  ('unit', 0.01691434040175052),\n",
       "  ('system', 0.016633276883489617),\n",
       "  ('behavior', 0.016243693155097525),\n",
       "  ('processing', 0.016243385715296012),\n",
       "  ('input', 0.0160660767687858),\n",
       "  ('multimodal', 0.016053498194294497),\n",
       "  ('object', 0.016021588837390164),\n",
       "  ('module', 0.01557008679991076),\n",
       "  ('draw', 0.015542564171238962),\n",
       "  ('generate', 0.015172124295055189),\n",
       "  ('text', 0.015158003260721828),\n",
       "  ('nonenglish', 0.015144786913806562),\n",
       "  ('interactive', 0.01490383371574588),\n",
       "  ('accord', 0.014618891669965153),\n",
       "  ('attractionrelated', 0.014563343349931876),\n",
       "  ('action', 0.014498801204438461),\n",
       "  ('biorhythm', 0.014402608798968809),\n",
       "  ('advantage', 0.014362754821360171),\n",
       "  ('experience', 0.014247966048385153),\n",
       "  ('output', 0.013971379836548177),\n",
       "  ('diagram', 0.013871792845255729),\n",
       "  ('modeling', 0.013814766273365572),\n",
       "  ('pet', 0.013723142224086776),\n",
       "  ('determine', 0.013453454253197045),\n",
       "  ('illustrate', 0.013433753002607459),\n",
       "  ('claim', 0.013414190119013914),\n",
       "  ('image', 0.013296794136154717),\n",
       "  ('humanoid', 0.013203315283942398),\n",
       "  ('emoticon', 0.013104916195482907),\n",
       "  ('physiological', 0.012940362813497423),\n",
       "  ('interact', 0.012861107829964219),\n",
       "  ('independent', 0.012767288264091252),\n",
       "  ('database', 0.012622376579824119),\n",
       "  ('provide', 0.012569840061147117),\n",
       "  ('receive', 0.012439980149438694),\n",
       "  ('set', 0.01224419342074094),\n",
       "  ('signal', 0.012196717729181772),\n",
       "  ('store', 0.01204923717487759),\n",
       "  ('result', 0.011714222614272235),\n",
       "  ('sensor', 0.01165957448275222),\n",
       "  ('word', 0.011327672378996453),\n",
       "  ('current', 0.011320700689248732),\n",
       "  ('step', 0.011231339167651844),\n",
       "  ('sense', 0.011196552058913418),\n",
       "  ('parse', 0.011001321288447889),\n",
       "  ('instruction', 0.010916078877392418),\n",
       "  ('characteristic', 0.010817289646213474),\n",
       "  ('enable', 0.010429407104928049),\n",
       "  ('touch', 0.010421829995925044),\n",
       "  ('voice', 0.010407084291105338),\n",
       "  ('software', 0.010240766400591244),\n",
       "  ('screen', 0.01020108982595876),\n",
       "  ('attention', 0.009872855169916234),\n",
       "  ('analysis', 0.009306839429387667),\n",
       "  ('detect', 0.009174077767330497),\n",
       "  ('sensibility', 0.008948968528800528),\n",
       "  ('collect', 0.008683666456523088),\n",
       "  ('animation', 0.008677278003257372),\n",
       "  ('fuzzy', 0.008638619152386085),\n",
       "  ('perform', 0.008462595044134423),\n",
       "  ('level', 0.008462344830073118),\n",
       "  ('field', 0.008455339206451768),\n",
       "  ('affective', 0.008451135468269418),\n",
       "  ('selection', 0.00834976647393142),\n",
       "  ('improve', 0.008344802174030101),\n",
       "  ('service', 0.008277177507528287),\n",
       "  ('nervous', 0.00821769501029118),\n",
       "  ('block', 0.008148201534634253)],\n",
       " 12: [('food', 0.20074447834374226),\n",
       "  ('dish', 0.1494049575457043),\n",
       "  ('cook', 0.1458867731193299),\n",
       "  ('kitchen', 0.06613440412098566),\n",
       "  ('meal', 0.06018325811703335),\n",
       "  ('cooking', 0.05634000346774576),\n",
       "  ('menu', 0.04795191164811173),\n",
       "  ('recipe', 0.043170222928609885),\n",
       "  ('fry', 0.04032054364985602),\n",
       "  ('restaurant', 0.03927063108622242),\n",
       "  ('ingredient', 0.03732864490707853),\n",
       "  ('din', 0.03669716659545772),\n",
       "  ('item', 0.03378157058317554),\n",
       "  ('cooker', 0.03254491749674146),\n",
       "  ('process', 0.029589250497820494),\n",
       "  ('tea', 0.028670039431565413),\n",
       "  ('delivery', 0.02606648786680495),\n",
       "  ('pan', 0.02579479750348778),\n",
       "  ('method', 0.025548348910567235),\n",
       "  ('customer', 0.025384344720377414),\n",
       "  ('weight', 0.021803632840853782),\n",
       "  ('module', 0.021599919966736537),\n",
       "  ('robot', 0.02159567562915782),\n",
       "  ('prepare', 0.021416901915103113),\n",
       "  ('processing', 0.020324755087928078),\n",
       "  ('time', 0.020245263147488902),\n",
       "  ('data', 0.01927833871922526),\n",
       "  ('taste', 0.018876419113494497),\n",
       "  ('involve', 0.018526150507229954),\n",
       "  ('pot', 0.018343256942986993),\n",
       "  ('serve', 0.01828923452752489),\n",
       "  ('cater', 0.01773154509710119),\n",
       "  ('control', 0.017381735247147385),\n",
       "  ('accord', 0.017108821851193185),\n",
       "  ('salt', 0.01707941829235925),\n",
       "  ('heat', 0.016544816828093563),\n",
       "  ('system', 0.016105118159463385),\n",
       "  ('receive', 0.0157348849736312),\n",
       "  ('client', 0.015646030355229285),\n",
       "  ('claim', 0.015453930847602352),\n",
       "  ('merchant', 0.015171262545957034),\n",
       "  ('instruction', 0.015062571141418221),\n",
       "  ('preparation', 0.014851245341474192),\n",
       "  ('base', 0.014740379084456978),\n",
       "  ('table', 0.014527367977471166),\n",
       "  ('advantage', 0.014399597244837145),\n",
       "  ('breakfast', 0.014261149140313437),\n",
       "  ('vegetable', 0.014180185407836112),\n",
       "  ('chef', 0.01349803468585059),\n",
       "  ('intelligent', 0.01329431361543091),\n",
       "  ('set', 0.013230479825791236),\n",
       "  ('server', 0.0127600023588568),\n",
       "  ('provide', 0.012719312096845464),\n",
       "  ('target', 0.012525692757694634),\n",
       "  ('user', 0.012525064309789722),\n",
       "  ('finish', 0.012160151917355626),\n",
       "  ('determine', 0.01213421503628612),\n",
       "  ('independent', 0.012085617367343707),\n",
       "  ('gyroscope', 0.011825909485630979),\n",
       "  ('storage', 0.011739401832805498),\n",
       "  ('adjust', 0.011704965084374791),\n",
       "  ('arm', 0.011703825282372743),\n",
       "  ('draw', 0.011680504105757494),\n",
       "  ('divide', 0.011384894407236267),\n",
       "  ('tilt', 0.011216655184400166),\n",
       "  ('robotized', 0.01116364643782339),\n",
       "  ('device', 0.011162456317271592),\n",
       "  ('management', 0.011141052940414852),\n",
       "  ('plate', 0.011118217004444863),\n",
       "  ('robotic', 0.011069747122770838),\n",
       "  ('nutritional', 0.010969583243614783),\n",
       "  ('supply', 0.010853998249768638),\n",
       "  ('occupy', 0.010768002960137576),\n",
       "  ('screw', 0.01051830958519355),\n",
       "  ('smoke', 0.010482259094314736),\n",
       "  ('image', 0.010416704994578573),\n",
       "  ('detailed', 0.010318258663381858),\n",
       "  ('waiter', 0.010164225676497038),\n",
       "  ('add', 0.01008951908215587),\n",
       "  ('characteristic', 0.010004336889398202),\n",
       "  ('oven', 0.009897391926796667),\n",
       "  ('perform', 0.009728209628619018),\n",
       "  ('display', 0.009694765124698721),\n",
       "  ('apparatus', 0.009646189584652196),\n",
       "  ('soup', 0.009624738625143634),\n",
       "  ('prestored', 0.009544079306541898),\n",
       "  ('store', 0.009530132367878877),\n",
       "  ('return', 0.009455087435540991),\n",
       "  ('multiple', 0.009398720504795333),\n",
       "  ('improve', 0.009397391472160375),\n",
       "  ('slave', 0.009147242780623083),\n",
       "  ('season', 0.00899868979056706),\n",
       "  ('product', 0.008998268487230102),\n",
       "  ('controller', 0.00899484124305422),\n",
       "  ('move', 0.008969799308626713),\n",
       "  ('enable', 0.008936369264271953),\n",
       "  ('cookware', 0.008934416310170955),\n",
       "  ('nonenglish', 0.008898316534317222),\n",
       "  ('leaf', 0.00889830222401195),\n",
       "  ('replication', 0.008817118359766498)],\n",
       " 13: [('park', 0.4062483799235324),\n",
       "  ('vehicle', 0.17074217861877067),\n",
       "  ('parking', 0.10618935621704494),\n",
       "  ('car', 0.0787290963877489),\n",
       "  ('garage', 0.07391054680715048),\n",
       "  ('space', 0.06043464369941806),\n",
       "  ('robot', 0.029795380850938406),\n",
       "  ('lot', 0.027688917071211114),\n",
       "  ('intelligent', 0.026122985117508563),\n",
       "  ('access', 0.02555763002522634),\n",
       "  ('module', 0.025484466891421136),\n",
       "  ('store', 0.02524604986108283),\n",
       "  ('illegal', 0.02515456810327435),\n",
       "  ('system', 0.025141103225562615),\n",
       "  ('position', 0.022588369801735602),\n",
       "  ('route', 0.022372626604134877),\n",
       "  ('plate', 0.02103786255646936),\n",
       "  ('guide', 0.02089691751847225),\n",
       "  ('hall', 0.02063615090816666),\n",
       "  ('driver', 0.020625565734695175),\n",
       "  ('camera', 0.018517439272810427),\n",
       "  ('server', 0.018298947577063514),\n",
       "  ('automatic', 0.018142233693040605),\n",
       "  ('lift', 0.017421624555429956),\n",
       "  ('management', 0.017391884942603887),\n",
       "  ('provide', 0.01723540018385572),\n",
       "  ('path', 0.017058735723207347),\n",
       "  ('channel', 0.016508633863963864),\n",
       "  ('automobile', 0.01634331243378119),\n",
       "  ('method', 0.016338548659406205),\n",
       "  ('device', 0.016237208531998015),\n",
       "  ('connect', 0.016055663608912567),\n",
       "  ('transport', 0.015635797748538502),\n",
       "  ('time', 0.015629678917512577),\n",
       "  ('retrieval', 0.015352679437718841),\n",
       "  ('draw', 0.015270348923786448),\n",
       "  ('unit', 0.015222845642029215),\n",
       "  ('freight', 0.01479846174349788),\n",
       "  ('handle', 0.014634659310991019),\n",
       "  ('vehiclecarrying', 0.014391952493403384),\n",
       "  ('arrange', 0.01411885061534215),\n",
       "  ('carry', 0.013745451279863529),\n",
       "  ('accord', 0.013477851243774793),\n",
       "  ('road', 0.013438869763618654),\n",
       "  ('send', 0.01311770113925284),\n",
       "  ('move', 0.012960918933837209),\n",
       "  ('data', 0.012874738081706943),\n",
       "  ('advantage', 0.012546238727091165),\n",
       "  ('control', 0.01247539441812754),\n",
       "  ('license', 0.012324500752873294),\n",
       "  ('exit', 0.012315459439540228),\n",
       "  ('request', 0.012181691646174336),\n",
       "  ('schedule', 0.01199902150264149),\n",
       "  ('transmit', 0.011855089154929348),\n",
       "  ('navigation', 0.011685174196733067),\n",
       "  ('involve', 0.011649091314911757),\n",
       "  ('language', 0.01158394375113534),\n",
       "  ('diagram', 0.011566581133739666),\n",
       "  ('drive', 0.011563441741034127),\n",
       "  ('empty', 0.01146238486844563),\n",
       "  ('mobile', 0.011315435772391661),\n",
       "  ('unparking', 0.01125243545878165),\n",
       "  ('detect', 0.011219312707205211),\n",
       "  ('nonenglish', 0.011064559011924683),\n",
       "  ('block', 0.01100002819581238),\n",
       "  ('text', 0.01076659760650917),\n",
       "  ('owner', 0.010693049277027555),\n",
       "  ('base', 0.010649561478144498),\n",
       "  ('claim', 0.010527080221555588),\n",
       "  ('andor', 0.010505672793890513),\n",
       "  ('background', 0.01027103767445961),\n",
       "  ('guidance', 0.0102405229454936),\n",
       "  ('process', 0.010197942911598734),\n",
       "  ('processing', 0.010032639395080117),\n",
       "  ('signal', 0.009909103770799546),\n",
       "  ('storage', 0.00987256308592932),\n",
       "  ('receive', 0.009796445292484614),\n",
       "  ('agv', 0.009626426633285674),\n",
       "  ('corridor', 0.009616031031550941),\n",
       "  ('fork', 0.009595840745158589),\n",
       "  ('refuel', 0.009594488078803908),\n",
       "  ('independent', 0.009462775910274444),\n",
       "  ('track', 0.009441675742457875),\n",
       "  ('share', 0.009272162384319691),\n",
       "  ('image', 0.009239279660900003),\n",
       "  ('confirm', 0.00895331815599621),\n",
       "  ('multistorey', 0.00889569348171012),\n",
       "  ('threedimensional', 0.008874280209956386),\n",
       "  ('convey', 0.008869672712083686),\n",
       "  ('arrangement', 0.008751423738892487),\n",
       "  ('user', 0.008750730656403293),\n",
       "  ('register', 0.008721732683446032),\n",
       "  ('charge', 0.008685368708205224),\n",
       "  ('motor', 0.008679536029174522),\n",
       "  ('distance', 0.008633955367094773),\n",
       "  ('collection', 0.008571246191759415),\n",
       "  ('judge', 0.008390208513653527),\n",
       "  ('main', 0.0082426991206882),\n",
       "  ('sensor', 0.008220218145668682),\n",
       "  ('arm', 0.008207028189625959)],\n",
       " 14: [('temperature', 0.3484726647993012),\n",
       "  ('heat', 0.036049395781519264),\n",
       "  ('thermal', 0.03283893616932227),\n",
       "  ('compensation', 0.031232623710278882),\n",
       "  ('infrared', 0.03004853460701353),\n",
       "  ('error', 0.029570025966797208),\n",
       "  ('industrial', 0.02865076625999498),\n",
       "  ('device', 0.028613888023508116),\n",
       "  ('motor', 0.02799612046857144),\n",
       "  ('sensor', 0.027483377790758497),\n",
       "  ('body', 0.027434594327087385),\n",
       "  ('robot', 0.027430979246064614),\n",
       "  ('measurement', 0.026338374992086834),\n",
       "  ('compensate', 0.025333940808669762),\n",
       "  ('method', 0.025284402057831074),\n",
       "  ('measure', 0.025019626678509047),\n",
       "  ('thermometer', 0.024059017002136588),\n",
       "  ('offset', 0.022978553546494942),\n",
       "  ('output', 0.02244552705519597),\n",
       "  ('vehicle', 0.021567219157891913),\n",
       "  ('threshold', 0.018914325446739766),\n",
       "  ('visor', 0.018278545196010243),\n",
       "  ('detect', 0.017847387523765537),\n",
       "  ('control', 0.01715678014094072),\n",
       "  ('data', 0.01707834006538426),\n",
       "  ('current', 0.0166797591200621),\n",
       "  ('determine', 0.01644116061402882),\n",
       "  ('temperaturecompensated', 0.01606827220900558),\n",
       "  ('accuracy', 0.01602485082045716),\n",
       "  ('rise', 0.015953412459782504),\n",
       "  ('gage', 0.01579092170258599),\n",
       "  ('subject', 0.01578237562004624),\n",
       "  ('shelter', 0.015495607615886376),\n",
       "  ('involve', 0.015342927291434487),\n",
       "  ('sun', 0.015197190583769725),\n",
       "  ('amd', 0.014216646263563523),\n",
       "  ('unit', 0.01415286440140799),\n",
       "  ('test', 0.01412802613633706),\n",
       "  ('color', 0.013792546252059435),\n",
       "  ('advantage', 0.013734693526436255),\n",
       "  ('position', 0.013706694886235084),\n",
       "  ('lmpa', 0.013669018403571376),\n",
       "  ('model', 0.013205818401831802),\n",
       "  ('condition', 0.01304181603503187),\n",
       "  ('module', 0.013028076884067173),\n",
       "  ('claim', 0.012874768431249312),\n",
       "  ('arm', 0.012794815153500554),\n",
       "  ('draw', 0.012702604697139444),\n",
       "  ('silicon', 0.012683766091389274),\n",
       "  ('change', 0.01249082208276451),\n",
       "  ('calibration', 0.01244293338566699),\n",
       "  ('base', 0.01236618015385562),\n",
       "  ('estimate', 0.012256165982953916),\n",
       "  ('mechanical', 0.012113605405453563),\n",
       "  ('removable', 0.011787314411656381),\n",
       "  ('speed', 0.01167093550308705),\n",
       "  ('collect', 0.011580108022067884),\n",
       "  ('drift', 0.011472089798129173),\n",
       "  ('windscreen', 0.011300919361539017),\n",
       "  ('saturation', 0.011247944370656652),\n",
       "  ('low', 0.011166084928642935),\n",
       "  ('volleyball', 0.01078001847523944),\n",
       "  ('independent', 0.010682869995726853),\n",
       "  ('calculate', 0.010605210075434178),\n",
       "  ('element', 0.010514511633596386),\n",
       "  ('thermostat', 0.010422086196748512),\n",
       "  ('preset', 0.010255856054485219),\n",
       "  ('regulate', 0.01023272701818467),\n",
       "  ('equipment', 0.010118769185312891),\n",
       "  ('system', 0.010086414330469341),\n",
       "  ('mobile', 0.009997360219700118),\n",
       "  ('normal', 0.009811400939942632),\n",
       "  ('growth', 0.009790362908003706),\n",
       "  ('actuator', 0.009708309119700052),\n",
       "  ('operate', 0.009636865306999478),\n",
       "  ('operation', 0.009595295775337992),\n",
       "  ('shaft', 0.009455107607720108),\n",
       "  ('calibrate', 0.009444929872883865),\n",
       "  ('overheat', 0.009359922934644382),\n",
       "  ('trend', 0.009304615511590815),\n",
       "  ('nonenglish', 0.009232611951837468),\n",
       "  ('set', 0.009008690013295406),\n",
       "  ('text', 0.008983983693823683),\n",
       "  ('manipulator', 0.00896471440332393),\n",
       "  ('language', 0.008892722504169448),\n",
       "  ('ambient', 0.008880098399384924),\n",
       "  ('arxpls', 0.008813917421723123),\n",
       "  ('process', 0.008803926234746651),\n",
       "  ('diagram', 0.008705287871719527),\n",
       "  ('drive', 0.00870292508906767),\n",
       "  ('distribution', 0.008661513335689446),\n",
       "  ('person', 0.008652172703236942),\n",
       "  ('rate', 0.008641501828497274),\n",
       "  ('detection', 0.0086093273503666),\n",
       "  ('reduce', 0.00843822277484163),\n",
       "  ('provide', 0.008414126130009287),\n",
       "  ('component', 0.008409760011490684),\n",
       "  ('accumulate', 0.00833507375754508),\n",
       "  ('time', 0.00830348699237264),\n",
       "  ('health', 0.00822141420223054)],\n",
       " 15: [('nanowire', 0.08403298136325342),\n",
       "  ('afm', 0.07520291743573992),\n",
       "  ('nanomanipulation', 0.06896001313843338),\n",
       "  ('nanomanipulator', 0.05642282781854099),\n",
       "  ('microscope', 0.05586429426872812),\n",
       "  ('manipulation', 0.05509841659743581),\n",
       "  ('cnt', 0.04987890901976978),\n",
       "  ('micronano', 0.04478441681369025),\n",
       "  ('assembly', 0.04283676107981162),\n",
       "  ('nano', 0.04158170503971416),\n",
       "  ('cantilever', 0.04132622965467365),\n",
       "  ('atomic', 0.04120847077124848),\n",
       "  ('force', 0.035755269318377365),\n",
       "  ('sem', 0.035668972312982786),\n",
       "  ('feedback', 0.0348022005398164),\n",
       "  ('metatasks', 0.030349242571993854),\n",
       "  ('nanowires', 0.027333345911440734),\n",
       "  ('nanorobotic', 0.02709704605710298),\n",
       "  ('microscopy', 0.02698483069582395),\n",
       "  ('substrate', 0.025531403927147773),\n",
       "  ('nanotube', 0.025432798438688425),\n",
       "  ('sample', 0.024944150430812613),\n",
       "  ('electron', 0.02424911027389198),\n",
       "  ('contact', 0.024199806256945643),\n",
       "  ('nanoscale', 0.0224455090588964),\n",
       "  ('technique', 0.02201938693123216),\n",
       "  ('carbon', 0.020476753407971754),\n",
       "  ('probe', 0.01938729821256129),\n",
       "  ('model', 0.018325168730029366),\n",
       "  ('structure', 0.01783832422798769),\n",
       "  ('base', 0.017636705120522032),\n",
       "  ('vdw', 0.017627818879331392),\n",
       "  ('switch', 0.017592553350758777),\n",
       "  ('stabilize', 0.017222652175289968),\n",
       "  ('crystal', 0.01720894083455375),\n",
       "  ('microchannel', 0.016722958233464622),\n",
       "  ('handle', 0.016673699396970953),\n",
       "  ('paper', 0.016670765320769432),\n",
       "  ('robotic', 0.016495574148331197),\n",
       "  ('fabrication', 0.016200714970430963),\n",
       "  ('strategy', 0.01618402504336691),\n",
       "  ('assemble', 0.015421705385330688),\n",
       "  ('nanoparticles', 0.015326391362065985),\n",
       "  ('cellular', 0.015239612510468827),\n",
       "  ('scan', 0.015168855744309472),\n",
       "  ('nanostructures', 0.014958986369538048),\n",
       "  ('heterostructures', 0.014958986369538048),\n",
       "  ('nmc', 0.014958986369538048),\n",
       "  ('manipulator', 0.014927956668068192),\n",
       "  ('learn', 0.01478771465897118),\n",
       "  ('nems', 0.014689849066109494),\n",
       "  ('nanobits', 0.014689849066109494),\n",
       "  ('surface', 0.014420115649556605),\n",
       "  ('electrode', 0.014222952137693406),\n",
       "  ('der', 0.01409132342965721),\n",
       "  ('waals', 0.01409132342965721),\n",
       "  ('railguided', 0.013795110259997207),\n",
       "  ('array', 0.013584943577007392),\n",
       "  ('beam', 0.01354626283385967),\n",
       "  ('electric', 0.013347570419586946),\n",
       "  ('insitu', 0.013154514321956405),\n",
       "  ('resolution', 0.013080526223565354),\n",
       "  ('van', 0.013068182511375205),\n",
       "  ('design', 0.012915757395345055),\n",
       "  ('graphene', 0.012912225902419156),\n",
       "  ('manufacture', 0.012744759812191649),\n",
       "  ('propose', 0.012709732017941304),\n",
       "  ('operation', 0.0126492458331515),\n",
       "  ('precise', 0.01246144262312021),\n",
       "  ('twodimensional', 0.01246144262312021),\n",
       "  ('deposition', 0.012391498489869495),\n",
       "  ('distributedparameters', 0.012230709147357154),\n",
       "  ('vascularlike', 0.012230709147357154),\n",
       "  ('chargedparticle', 0.012230709147357154),\n",
       "  ('lumpedparameters', 0.012230709147357154),\n",
       "  ('nanomechanical', 0.012230709147357154),\n",
       "  ('error', 0.01222262661751287),\n",
       "  ('bend', 0.01211021185339301),\n",
       "  ('atomically', 0.011967189095630439),\n",
       "  ('atomicforce', 0.011967189095630439),\n",
       "  ('threedimensional', 0.011916216827541083),\n",
       "  ('suspend', 0.011791507388775381),\n",
       "  ('device', 0.011787810933806073),\n",
       "  ('fuse', 0.011508551706178045),\n",
       "  ('oxygen', 0.011367016821774628),\n",
       "  ('process', 0.011277087498346872),\n",
       "  ('characterization', 0.011266344728186781),\n",
       "  ('develop', 0.01120706569626848),\n",
       "  ('visual', 0.010941319591515565),\n",
       "  ('dmp', 0.010933338364576294),\n",
       "  ('manipulate', 0.010806583040530887),\n",
       "  ('cnts', 0.010751307321326538),\n",
       "  ('servoing', 0.010593368604841094),\n",
       "  ('piezoresistive', 0.010508492876784365),\n",
       "  ('publication', 0.010454546009100165),\n",
       "  ('image', 0.01042131823859743),\n",
       "  ('system', 0.010416000407183343),\n",
       "  ('microassembly', 0.010318787820764052),\n",
       "  ('holonomic', 0.010066652956977217),\n",
       "  ('method', 0.010065690268270706)],\n",
       " 16: [('brake', 0.4662014266467389),\n",
       "  ('motor', 0.07376402867223125),\n",
       "  ('release', 0.05063512031923192),\n",
       "  ('drive', 0.04711226049727451),\n",
       "  ('torque', 0.042345542790025836),\n",
       "  ('shaft', 0.035625305239926644),\n",
       "  ('robot', 0.0342469356658508),\n",
       "  ('arm', 0.03395987897059469),\n",
       "  ('test', 0.03346017779832914),\n",
       "  ('manipulator', 0.02866269230994726),\n",
       "  ('detect', 0.027952044277258586),\n",
       "  ('braking', 0.02731575071724665),\n",
       "  ('solenoid', 0.027160554479965196),\n",
       "  ('pedal', 0.027092498873474407),\n",
       "  ('control', 0.025774880947890252),\n",
       "  ('unit', 0.024540699079934846),\n",
       "  ('method', 0.02356030178244795),\n",
       "  ('abnormality', 0.02336112993849547),\n",
       "  ('industrial', 0.022795098974651148),\n",
       "  ('operation', 0.021588811104501955),\n",
       "  ('electromagnet', 0.02129405608796827),\n",
       "  ('movement', 0.021103794289265447),\n",
       "  ('load', 0.020692803259409625),\n",
       "  ('permanent', 0.0177164935432445),\n",
       "  ('emergency', 0.017649140208279426),\n",
       "  ('involve', 0.01730356891378231),\n",
       "  ('direction', 0.017135420416162638),\n",
       "  ('safety', 0.016385384808438205),\n",
       "  ('force', 0.01619017038535871),\n",
       "  ('caliper', 0.015934187918393877),\n",
       "  ('claim', 0.015832394460196696),\n",
       "  ('power', 0.015577507919016303),\n",
       "  ('pin', 0.015526176400404929),\n",
       "  ('determine', 0.015259682755491057),\n",
       "  ('advantage', 0.015247793739193688),\n",
       "  ('magnet', 0.01495872051365546),\n",
       "  ('joint', 0.014949239045140023),\n",
       "  ('distance', 0.014620367454073947),\n",
       "  ('product', 0.01451081316515905),\n",
       "  ('draw', 0.014504917900037752),\n",
       "  ('lock', 0.014436159438307462),\n",
       "  ('vehicle', 0.014365919790545916),\n",
       "  ('diagnose', 0.014339852909254467),\n",
       "  ('semifinished', 0.014289724084977896),\n",
       "  ('axis', 0.01410417051970944),\n",
       "  ('condition', 0.013727843087181165),\n",
       "  ('coil', 0.01361803555774846),\n",
       "  ('time', 0.013520101962259556),\n",
       "  ('output', 0.013289742650468766),\n",
       "  ('independent', 0.013282933592570424),\n",
       "  ('calculate', 0.01325614148170925),\n",
       "  ('rotation', 0.01312834304716931),\n",
       "  ('electromagnetic', 0.013014702931341462),\n",
       "  ('automobile', 0.012852195066714537),\n",
       "  ('position', 0.012833938856488756),\n",
       "  ('detailed', 0.012813273590643643),\n",
       "  ('ensure', 0.012811422671585204),\n",
       "  ('brakeequipped', 0.012765453976725967),\n",
       "  ('sensor', 0.012679945776184089),\n",
       "  ('decrease', 0.012608304096364795),\n",
       "  ('apply', 0.012441138496321906),\n",
       "  ('performance', 0.012406219172397348),\n",
       "  ('exceed', 0.012404062056150278),\n",
       "  ('controller', 0.012351840445776361),\n",
       "  ('judge', 0.012338193754293316),\n",
       "  ('speed', 0.012284851345597075),\n",
       "  ('electrify', 0.012138124385370428),\n",
       "  ('disk', 0.012113795867832247),\n",
       "  ('monitor', 0.012008365334295279),\n",
       "  ('computer', 0.012002762416756633),\n",
       "  ('valve', 0.01153428070238759),\n",
       "  ('operate', 0.011411757859132662),\n",
       "  ('program', 0.01134726663987373),\n",
       "  ('core', 0.01119607488412388),\n",
       "  ('schematic', 0.011181854700306014),\n",
       "  ('presetting', 0.011166328723355325),\n",
       "  ('acceleration', 0.01114868576813159),\n",
       "  ('safe', 0.011017641395311195),\n",
       "  ('data', 0.010757331862801877),\n",
       "  ('poweroff', 0.010508511671500577),\n",
       "  ('encoder', 0.010374840936900423),\n",
       "  ('servo', 0.010217523196709044),\n",
       "  ('relieve', 0.010115103654475356),\n",
       "  ('device', 0.010059288393247963),\n",
       "  ('mechanical', 0.010041260212633464),\n",
       "  ('industry', 0.009915602587902202),\n",
       "  ('connect', 0.009906547021209383),\n",
       "  ('opposite', 0.00967071149917057),\n",
       "  ('spring', 0.009614899461878226),\n",
       "  ('strike', 0.009614797650574778),\n",
       "  ('abnormal', 0.009603651972141206),\n",
       "  ('block', 0.009515326807416083),\n",
       "  ('energy', 0.009504632599509538),\n",
       "  ('apparatus', 0.009411831237114485),\n",
       "  ('provide', 0.009341079178723464),\n",
       "  ('hold', 0.0092979138128746),\n",
       "  ('respective', 0.009010231682949895),\n",
       "  ('deactivate', 0.008979125523156396),\n",
       "  ('motion', 0.008886919488636763),\n",
       "  ('diagram', 0.008835947089316872)],\n",
       " 17: [('magnetic', 0.22809086046012134),\n",
       "  ('field', 0.10740898191948099),\n",
       "  ('geomagnetic', 0.08996716694429613),\n",
       "  ('sensor', 0.05057506447730427),\n",
       "  ('position', 0.043957180445198495),\n",
       "  ('magic', 0.03260416445071533),\n",
       "  ('coil', 0.03200806537904388),\n",
       "  ('ferromagnetic', 0.03186880787095375),\n",
       "  ('flux', 0.026752816204741507),\n",
       "  ('estimate', 0.025842969995461373),\n",
       "  ('magnetism', 0.025359966846697373),\n",
       "  ('mobile', 0.025296146989281593),\n",
       "  ('magnet', 0.023972205269999405),\n",
       "  ('system', 0.023444149368701785),\n",
       "  ('cube', 0.022442378089576154),\n",
       "  ('robot', 0.021042283915849887),\n",
       "  ('location', 0.01964916958828549),\n",
       "  ('map', 0.018847634810219335),\n",
       "  ('fluxgate', 0.018459576628426705),\n",
       "  ('sense', 0.01777885884132712),\n",
       "  ('recognize', 0.017031362832029467),\n",
       "  ('navigation', 0.016689511248416056),\n",
       "  ('base', 0.016514130218921893),\n",
       "  ('earth', 0.016410636508730012),\n",
       "  ('freebot', 0.016071446176122592),\n",
       "  ('direction', 0.01569170935552767),\n",
       "  ('autonomous', 0.01556257108965357),\n",
       "  ('green', 0.015267372489418998),\n",
       "  ('determine', 0.01517866415859923),\n",
       "  ('method', 0.014945372793709473),\n",
       "  ('measure', 0.014609244690629573),\n",
       "  ('unit', 0.014068507778365564),\n",
       "  ('detection', 0.014004020262276762),\n",
       "  ('geophysical', 0.013392871813435493),\n",
       "  ('geomagnetism', 0.013392871813435493),\n",
       "  ('element', 0.013302343116528401),\n",
       "  ('move', 0.01322257947758897),\n",
       "  ('component', 0.013094812151653368),\n",
       "  ('tca', 0.012847190432368497),\n",
       "  ('pole', 0.012699587966300465),\n",
       "  ('angular', 0.012697733294218912),\n",
       "  ('array', 0.012385519218122216),\n",
       "  ('trajectory', 0.01220050344767983),\n",
       "  ('conductive', 0.011983569634839856),\n",
       "  ('calibrate', 0.011949171037026694),\n",
       "  ('vehicle', 0.01193744129028674),\n",
       "  ('particle', 0.01170349507585359),\n",
       "  ('body', 0.011280307627086402),\n",
       "  ('positioning', 0.011215613232406921),\n",
       "  ('signal', 0.011173274337577897),\n",
       "  ('wireless', 0.011133846856027559),\n",
       "  ('detect', 0.010925548738118964),\n",
       "  ('draw', 0.010905043255667685),\n",
       "  ('magnetometer', 0.010873975519449904),\n",
       "  ('calibration', 0.010770889422175434),\n",
       "  ('marker', 0.010748513128208945),\n",
       "  ('permeable', 0.010548329501958116),\n",
       "  ('terrestrial', 0.010539690237591789),\n",
       "  ('path', 0.010535945785583724),\n",
       "  ('disturbance', 0.010362217988688508),\n",
       "  ('advantage', 0.010317194918495606),\n",
       "  ('measurement', 0.010181650868034166),\n",
       "  ('data', 0.010113687252717463),\n",
       "  ('environment', 0.010078326274443635),\n",
       "  ('orientation', 0.010058886438605424),\n",
       "  ('set', 0.010056411146185197),\n",
       "  ('piece', 0.010044700649283516),\n",
       "  ('groundtruth', 0.009727789555563207),\n",
       "  ('landmark', 0.009709384317389222),\n",
       "  ('space', 0.009673413591447669),\n",
       "  ('shield', 0.009517913987566394),\n",
       "  ('pair', 0.009510020705366612),\n",
       "  ('shape', 0.00950126490840206),\n",
       "  ('electromagnet', 0.009479150809011447),\n",
       "  ('independent', 0.009460738165798477),\n",
       "  ('process', 0.009424639948988546),\n",
       "  ('circle', 0.009414844317141865),\n",
       "  ('material', 0.009375318086365497),\n",
       "  ('rotate', 0.009367842827803742),\n",
       "  ('provide', 0.009314426301389823),\n",
       "  ('procedure', 0.009159925224821935),\n",
       "  ('paper', 0.009119334935361411),\n",
       "  ('view', 0.009054497297645531),\n",
       "  ('distance', 0.009043148298893739),\n",
       "  ('result', 0.008955970187136184),\n",
       "  ('center', 0.008896209390157128),\n",
       "  ('accuracy', 0.00881465256669772),\n",
       "  ('involve', 0.008781153669967953),\n",
       "  ('claim', 0.008770677738650014),\n",
       "  ('surface', 0.008764635568424986),\n",
       "  ('active', 0.008706776410295684),\n",
       "  ('threeaxis', 0.008547422588797557),\n",
       "  ('simultaneously', 0.008530123667450658),\n",
       "  ('transmitter', 0.008523214284219904),\n",
       "  ('operation', 0.008497583607230684),\n",
       "  ('circuit', 0.008431570875898473),\n",
       "  ('detailed', 0.008365705274321981),\n",
       "  ('hausdorff', 0.008363138334205655),\n",
       "  ('object', 0.008282944290742772),\n",
       "  ('iron', 0.008242807355734202)],\n",
       " 18: [('cloth', 0.15568318943051718),\n",
       "  ('garment', 0.12004041227510931),\n",
       "  ('textile', 0.10715508523051312),\n",
       "  ('sew', 0.10200832059003152),\n",
       "  ('clothes', 0.07058152099856005),\n",
       "  ('fabric', 0.06754910051671986),\n",
       "  ('handle', 0.06436664819338524),\n",
       "  ('sheet', 0.03980680005397168),\n",
       "  ('fold', 0.0353732522749141),\n",
       "  ('towel', 0.0326589039437964),\n",
       "  ('paper', 0.03207216025971525),\n",
       "  ('system', 0.031310765797994654),\n",
       "  ('piece', 0.0309882601827672),\n",
       "  ('wrinkle', 0.026485678155750866),\n",
       "  ('robotic', 0.02586223504256804),\n",
       "  ('band', 0.02471691204418496),\n",
       "  ('material', 0.024611006222640123),\n",
       "  ('clothing', 0.02296751389096158),\n",
       "  ('pattern', 0.02243070394970134),\n",
       "  ('cotton', 0.021670100309250706),\n",
       "  ('flexible', 0.021219546658238022),\n",
       "  ('propose', 0.020912638657771807),\n",
       "  ('electroadhesive', 0.01975508802975649),\n",
       "  ('camera', 0.019302423694001612),\n",
       "  ('process', 0.019031138693024842),\n",
       "  ('adsorption', 0.018877467498999097),\n",
       "  ('iron', 0.018309135621257137),\n",
       "  ('robot', 0.01796337757173857),\n",
       "  ('laundry', 0.017121905813900974),\n",
       "  ('pick', 0.016450238073543757),\n",
       "  ('electrostatic', 0.016285191610365967),\n",
       "  ('collar', 0.015602260077273816),\n",
       "  ('manipulation', 0.015569367985442912),\n",
       "  ('machine', 0.015402701232832326),\n",
       "  ('model', 0.01518157680112747),\n",
       "  ('tryon', 0.015146812207361844),\n",
       "  ('humancloth', 0.015146812207361844),\n",
       "  ('spread', 0.014556813021413255),\n",
       "  ('experiment', 0.014550635632832397),\n",
       "  ('task', 0.014477126529469276),\n",
       "  ('automate', 0.014107189313265888),\n",
       "  ('shape', 0.014069635928136984),\n",
       "  ('image', 0.01406955849491958),\n",
       "  ('hanger', 0.014046618558799462),\n",
       "  ('cut', 0.014022564030144511),\n",
       "  ('blanket', 0.013718639012766487),\n",
       "  ('hand', 0.013667198593393822),\n",
       "  ('edge', 0.013615694149211672),\n",
       "  ('method', 0.013395299382251655),\n",
       "  ('fuzzy', 0.012695369800679004),\n",
       "  ('apply', 0.01265313995948793),\n",
       "  ('grasp', 0.01244984399436154),\n",
       "  ('ironing', 0.012384278589566124),\n",
       "  ('sewing', 0.012384278589566124),\n",
       "  ('approach', 0.01207660067195677),\n",
       "  ('device', 0.011935819322212606),\n",
       "  ('gripper', 0.011891687920745906),\n",
       "  ('study', 0.011889176169114522),\n",
       "  ('fit', 0.011651962353891628),\n",
       "  ('controller', 0.01157055811406334),\n",
       "  ('cutter', 0.011362902806286525),\n",
       "  ('deformation', 0.011338884990578916),\n",
       "  ('deformable', 0.011106196212854804),\n",
       "  ('ductility', 0.011070617949422991),\n",
       "  ('relationship', 0.011000784891269242),\n",
       "  ('result', 0.01071173989727384),\n",
       "  ('base', 0.010618360969180129),\n",
       "  ('characteristic', 0.010598105235511258),\n",
       "  ('industry', 0.010588796413825248),\n",
       "  ('unfold', 0.010585813851366893),\n",
       "  ('human', 0.01057714834427406),\n",
       "  ('motion', 0.010544748415664967),\n",
       "  ('automation', 0.010418783446796377),\n",
       "  ('furniture', 0.010397723586723754),\n",
       "  ('processing', 0.010344266071656746),\n",
       "  ('develop', 0.010316165651110572),\n",
       "  ('type', 0.010193198559380345),\n",
       "  ('workbench', 0.010167541392529756),\n",
       "  ('pose', 0.010129175548038563),\n",
       "  ('attach', 0.01002125844410815),\n",
       "  ('learn', 0.009982259999987123),\n",
       "  ('buckle', 0.009825441201787981),\n",
       "  ('control', 0.009714634896751123),\n",
       "  ('provide', 0.009605812902533024),\n",
       "  ('experimental', 0.009576025871433578),\n",
       "  ('depth', 0.009493173707703919),\n",
       "  ('train', 0.009491236899800413),\n",
       "  ('algorithm', 0.009300437332876792),\n",
       "  ('attachment', 0.009249392889973347),\n",
       "  ('finish', 0.009017309171741003),\n",
       "  ('parameter', 0.009000266124695636),\n",
       "  ('position', 0.00895768984813222),\n",
       "  ('servoing', 0.008938649592575185),\n",
       "  ('surface', 0.008922940520769482),\n",
       "  ('sewn', 0.008786332757796951),\n",
       "  ('wardrobe', 0.008786332757796951),\n",
       "  ('multiarm', 0.00877315133144342),\n",
       "  ('operation', 0.008763416619927522),\n",
       "  ('vision', 0.00867772942020018),\n",
       "  ('skill', 0.00865310259269876)],\n",
       " 19: [('shoe', 0.22918697580028963),\n",
       "  ('glue', 0.21683856442407207),\n",
       "  ('sole', 0.18111979561623648),\n",
       "  ('spray', 0.12438820082421641),\n",
       "  ('footwear', 0.057897627742784216),\n",
       "  ('upper', 0.0424881124347937),\n",
       "  ('track', 0.03369486917506153),\n",
       "  ('edge', 0.03341734311329741),\n",
       "  ('coat', 0.03158579249123713),\n",
       "  ('vamp', 0.03137261277383678),\n",
       "  ('process', 0.02997135542757443),\n",
       "  ('gluespraying', 0.02765479811443185),\n",
       "  ('shoelace', 0.02539712112669028),\n",
       "  ('threedimensional', 0.025335986437464937),\n",
       "  ('shoemaking', 0.025140725558574408),\n",
       "  ('curve', 0.024754994368827717),\n",
       "  ('method', 0.023847318170687512),\n",
       "  ('generate', 0.022619342722727254),\n",
       "  ('sol', 0.021572729540803713),\n",
       "  ('heel', 0.02143435068572776),\n",
       "  ('robot', 0.021187909204776385),\n",
       "  ('contour', 0.020932963037262775),\n",
       "  ('lace', 0.020797928608327593),\n",
       "  ('automatic', 0.020050028269472976),\n",
       "  ('hole', 0.019928631670801143),\n",
       "  ('production', 0.019690440224001612),\n",
       "  ('system', 0.01927911092315248),\n",
       "  ('surface', 0.01897982579038134),\n",
       "  ('outsole', 0.018198187532286643),\n",
       "  ('belt', 0.018036647562841943),\n",
       "  ('portion', 0.0180083170643208),\n",
       "  ('manufacturing', 0.01791519358263963),\n",
       "  ('manufacture', 0.016892020048971307),\n",
       "  ('cloud', 0.016855154430076357),\n",
       "  ('bond', 0.016596078715414214),\n",
       "  ('attitude', 0.016386853184466508),\n",
       "  ('perform', 0.016350068997084733),\n",
       "  ('adhesive', 0.01625293131000245),\n",
       "  ('involve', 0.016167105701224573),\n",
       "  ('overflow', 0.01612947728736188),\n",
       "  ('data', 0.015621833796692625),\n",
       "  ('spraying', 0.015421434348513669),\n",
       "  ('accord', 0.015278481419912204),\n",
       "  ('scan', 0.01488538734056966),\n",
       "  ('toe', 0.014864108128134736),\n",
       "  ('boundary', 0.014439747726123758),\n",
       "  ('path', 0.013820988203899555),\n",
       "  ('model', 0.013662193812152647),\n",
       "  ('object', 0.013600372322581886),\n",
       "  ('instruction', 0.013386860592138625),\n",
       "  ('plasma', 0.013368275117351228),\n",
       "  ('operation', 0.013346160656039122),\n",
       "  ('conveyor', 0.013202407165593935),\n",
       "  ('candyshaped', 0.013178317224836696),\n",
       "  ('profile', 0.01314048292966026),\n",
       "  ('enable', 0.013103515130116589),\n",
       "  ('remove', 0.01299881631395984),\n",
       "  ('processing', 0.012889390951645305),\n",
       "  ('material', 0.012777645715330478),\n",
       "  ('acquire', 0.012424360224271907),\n",
       "  ('arm', 0.012273374772684286),\n",
       "  ('draw', 0.012046457239014405),\n",
       "  ('control', 0.011980308572189865),\n",
       "  ('advantage', 0.01193979780933472),\n",
       "  ('enterprise', 0.01137079982428905),\n",
       "  ('realize', 0.011272117671236707),\n",
       "  ('claim', 0.011270518090309514),\n",
       "  ('jump', 0.011162703446876126),\n",
       "  ('blockingproof', 0.011144851192385978),\n",
       "  ('controller', 0.01110673966935109),\n",
       "  ('coordinate', 0.011044291558427321),\n",
       "  ('station', 0.010971124371519994),\n",
       "  ('pulling', 0.010904726786898114),\n",
       "  ('base', 0.010858713479194955),\n",
       "  ('joint', 0.010854667808369469),\n",
       "  ('cotton', 0.01083407848839321),\n",
       "  ('independent', 0.010806454448192887),\n",
       "  ('view', 0.01069501178833837),\n",
       "  ('detailed', 0.010641532304093872),\n",
       "  ('extract', 0.010621737148737837),\n",
       "  ('camera', 0.010573422952007762),\n",
       "  ('image', 0.010551222573201057),\n",
       "  ('position', 0.010479557251709163),\n",
       "  ('finish', 0.010433379169655362),\n",
       "  ('rough', 0.01042117988300509),\n",
       "  ('device', 0.01017594383402604),\n",
       "  ('set', 0.010051000109786925),\n",
       "  ('target', 0.009859957292209478),\n",
       "  ('dimensional', 0.009479788484921552),\n",
       "  ('assembly', 0.009421917642530161),\n",
       "  ('efficiency', 0.009395470366783636),\n",
       "  ('guide', 0.009257664219171225),\n",
       "  ('automatically', 0.009218399156458924),\n",
       "  ('posture', 0.009166790262192241),\n",
       "  ('initial', 0.009123452102396597),\n",
       "  ('component', 0.008997839295421625),\n",
       "  ('nonenglish', 0.008927385941497243),\n",
       "  ('step', 0.008912250437177595),\n",
       "  ('text', 0.008686977222184668),\n",
       "  ('plane', 0.00860593455439898)],\n",
       " 20: [('medicine', 0.4517408063351853),\n",
       "  ('pharmacy', 0.07923947529866984),\n",
       "  ('medication', 0.07909229060542548),\n",
       "  ('drug', 0.07257097037054773),\n",
       "  ('storage', 0.059882100093471294),\n",
       "  ('delivery', 0.055002436312188034),\n",
       "  ('store', 0.04166805200020052),\n",
       "  ('dispense', 0.03711614076401286),\n",
       "  ('vial', 0.03542559562764188),\n",
       "  ('pharmaceutical', 0.034090926372820456),\n",
       "  ('dosage', 0.03078758305748116),\n",
       "  ('drawer', 0.03052718750044628),\n",
       "  ('basket', 0.03045668584309005),\n",
       "  ('dose', 0.029743537966115983),\n",
       "  ('box', 0.0296262569195186),\n",
       "  ('automatic', 0.02880945910886997),\n",
       "  ('deliver', 0.028767430021799323),\n",
       "  ('method', 0.028402341935053428),\n",
       "  ('management', 0.02779725932449431),\n",
       "  ('ointment', 0.02272277242365978),\n",
       "  ('item', 0.022044037571250962),\n",
       "  ('hospital', 0.021165383637284433),\n",
       "  ('user', 0.02115412299087287),\n",
       "  ('manage', 0.02114438010794725),\n",
       "  ('bottle', 0.020139216496954805),\n",
       "  ('involve', 0.019911574516716945),\n",
       "  ('checkexception', 0.019783108861595566),\n",
       "  ('robotbased', 0.019613340338821967),\n",
       "  ('stopper', 0.019271743808882764),\n",
       "  ('receive', 0.019249577743666313),\n",
       "  ('system', 0.01899548185589338),\n",
       "  ('medical', 0.018808419814898194),\n",
       "  ('device', 0.0187991964369159),\n",
       "  ('robot', 0.018556620811817408),\n",
       "  ('station', 0.01842565935701239),\n",
       "  ('accord', 0.018120204714713633),\n",
       "  ('control', 0.01794535770357439),\n",
       "  ('unit', 0.017317596552892004),\n",
       "  ('draw', 0.01695604716743976),\n",
       "  ('cabinet', 0.016467383847742156),\n",
       "  ('highvolume', 0.015814218839048697),\n",
       "  ('power', 0.01566586122670807),\n",
       "  ('instruction', 0.015517549080724833),\n",
       "  ('route', 0.015452531529595477),\n",
       "  ('protector', 0.015337647879729913),\n",
       "  ('outermost', 0.01508228872487284),\n",
       "  ('schedule', 0.015068353709413932),\n",
       "  ('distribution', 0.014837648755968996),\n",
       "  ('position', 0.014395969246488833),\n",
       "  ('people', 0.014336672840559886),\n",
       "  ('magic', 0.01433357840272738),\n",
       "  ('illustrate', 0.014066619739133309),\n",
       "  ('slot', 0.014050985515881432),\n",
       "  ('advantage', 0.014036761214579797),\n",
       "  ('mobile', 0.01383921450043165),\n",
       "  ('liquid', 0.01342766019438527),\n",
       "  ('chinese', 0.013412681610641535),\n",
       "  ('rectangular', 0.013405217211994763),\n",
       "  ('cap', 0.013372833205171871),\n",
       "  ('trough', 0.013343363068706945),\n",
       "  ('tobeidentified', 0.013262557446192423),\n",
       "  ('assembly', 0.013261864196642851),\n",
       "  ('mechanical', 0.013205355130530888),\n",
       "  ('tobestored', 0.013111894758777097),\n",
       "  ('claim', 0.013109726227975991),\n",
       "  ('grab', 0.012788749078898869),\n",
       "  ('mark', 0.012482957182083),\n",
       "  ('container', 0.01245737590810736),\n",
       "  ('vacancy', 0.01238543100082453),\n",
       "  ('send', 0.012138139975040207),\n",
       "  ('time', 0.012123008469231924),\n",
       "  ('batch', 0.012077608007004461),\n",
       "  ('quantity', 0.011873676345718462),\n",
       "  ('conveyor', 0.01182561538273695),\n",
       "  ('operate', 0.011791771664580918),\n",
       "  ('packaging', 0.011704692354316691),\n",
       "  ('independent', 0.011645673388317212),\n",
       "  ('diagram', 0.011620236579688092),\n",
       "  ('absorb', 0.011281056564089247),\n",
       "  ('weight', 0.011231115178460692),\n",
       "  ('single', 0.011170937496391828),\n",
       "  ('sterile', 0.011147294293425139),\n",
       "  ('comprise', 0.011073602507823896),\n",
       "  ('enable', 0.01104208005654431),\n",
       "  ('office', 0.01076391718281953),\n",
       "  ('target', 0.010714963529161101),\n",
       "  ('tshaped', 0.010674690454965557),\n",
       "  ('redesign', 0.010610045956953938),\n",
       "  ('regularly', 0.010461022420198205),\n",
       "  ('cylinder', 0.010398231617963763),\n",
       "  ('idle', 0.010370663013438506),\n",
       "  ('mechanism', 0.01037005224026006),\n",
       "  ('reduce', 0.010325099816797129),\n",
       "  ('boxpacked', 0.010294585457778001),\n",
       "  ('pack', 0.010151503371973266),\n",
       "  ('nonenglish', 0.010149286907644975),\n",
       "  ('person', 0.010105668912826448),\n",
       "  ('product', 0.010102926696149503),\n",
       "  ('staff', 0.010053313133125477),\n",
       "  ('andor', 0.00994549877429478)],\n",
       " 21: [('substation', 0.2631348072526147),\n",
       "  ('inspection', 0.15969592404999491),\n",
       "  ('transformer', 0.12153866162165018),\n",
       "  ('meter', 0.05462115517656231),\n",
       "  ('equipment', 0.03504467153233279),\n",
       "  ('insulator', 0.02975690778259843),\n",
       "  ('robot', 0.027496151721142916),\n",
       "  ('data', 0.025122745818187596),\n",
       "  ('image', 0.02413651555821257),\n",
       "  ('monitor', 0.02384729411178723),\n",
       "  ('method', 0.02339408530334632),\n",
       "  ('system', 0.02217514031448616),\n",
       "  ('device', 0.022079445830208107),\n",
       "  ('operation', 0.021662150774704802),\n",
       "  ('frame', 0.021649060028250764),\n",
       "  ('identification', 0.021615912271389853),\n",
       "  ('intelligent', 0.02126820012522439),\n",
       "  ('inspect', 0.02101008311811045),\n",
       "  ('pointer', 0.020933258232532326),\n",
       "  ('temperature', 0.020812302256744367),\n",
       "  ('power', 0.019652962734214467),\n",
       "  ('patrol', 0.019035659222860768),\n",
       "  ('appliance', 0.01888067392155673),\n",
       "  ('monitoring', 0.0185007785231885),\n",
       "  ('module', 0.01838245612582279),\n",
       "  ('test', 0.018035949936025208),\n",
       "  ('fire', 0.017657893686412907),\n",
       "  ('electric', 0.0176435566840238),\n",
       "  ('distribution', 0.017109804187582272),\n",
       "  ('realize', 0.01707060870385877),\n",
       "  ('rout', 0.01662678077080074),\n",
       "  ('collect', 0.01633938988403454),\n",
       "  ('read', 0.0157738115614005),\n",
       "  ('maintenance', 0.01558635261298573),\n",
       "  ('instrument', 0.015301448995737635),\n",
       "  ('keyprogramming', 0.015210473381454629),\n",
       "  ('charge', 0.015092786670364976),\n",
       "  ('highvoltage', 0.014966450953864093),\n",
       "  ('transfer', 0.01480511145463446),\n",
       "  ('video', 0.014145245910379481),\n",
       "  ('detection', 0.01388303419710015),\n",
       "  ('realtime', 0.01387620316318261),\n",
       "  ('management', 0.01385189755410631),\n",
       "  ('scene', 0.01376362162370251),\n",
       "  ('solve', 0.0137328151860845),\n",
       "  ('control', 0.013729913625382601),\n",
       "  ('component', 0.013691616765815146),\n",
       "  ('unit', 0.0135507439962874),\n",
       "  ('involve', 0.013401564774008192),\n",
       "  ('bear', 0.013353976839380064),\n",
       "  ('advantage', 0.013323394913628685),\n",
       "  ('anchor', 0.013317472806679824),\n",
       "  ('time', 0.013180632684530272),\n",
       "  ('position', 0.013043240824348034),\n",
       "  ('nonenglish', 0.013027101823367186),\n",
       "  ('draw', 0.012802299197271388),\n",
       "  ('flush', 0.01279486399177493),\n",
       "  ('text', 0.012676290411579498),\n",
       "  ('language', 0.012547521996276314),\n",
       "  ('transshipment', 0.012436328994926051),\n",
       "  ('rtv', 0.012424397981659984),\n",
       "  ('water', 0.01241528063683954),\n",
       "  ('network', 0.012348094047509242),\n",
       "  ('real', 0.012342744842260578),\n",
       "  ('process', 0.011944453416423013),\n",
       "  ('path', 0.011750536953900792),\n",
       "  ('angle', 0.011701159348945073),\n",
       "  ('infrared', 0.01169603102748174),\n",
       "  ('body', 0.011612962474089826),\n",
       "  ('tracktype', 0.011604007901103823),\n",
       "  ('scheme', 0.011556781695580248),\n",
       "  ('insulation', 0.011532022510547357),\n",
       "  ('accord', 0.01136597927305387),\n",
       "  ('manage', 0.011175227012921386),\n",
       "  ('base', 0.011147670658058913),\n",
       "  ('provide', 0.011130214127995626),\n",
       "  ('improve', 0.011083605829616535),\n",
       "  ('deep', 0.01073387185522257),\n",
       "  ('aerial', 0.010611478999248183),\n",
       "  ('key', 0.010582535549918783),\n",
       "  ('vehicle', 0.010460684014400817),\n",
       "  ('processor', 0.01008917311255875),\n",
       "  ('submersible', 0.010057700595108961),\n",
       "  ('platform', 0.00988029619923233),\n",
       "  ('accuracy', 0.009830811853882326),\n",
       "  ('background', 0.009816534236088146),\n",
       "  ('smart', 0.009811047170060202),\n",
       "  ('perform', 0.009773964242102966),\n",
       "  ('spray', 0.00963905864237492),\n",
       "  ('refers', 0.009428021145811977),\n",
       "  ('inclination', 0.009323378604622208),\n",
       "  ('performance', 0.00923902054473977),\n",
       "  ('condition', 0.009200920949362023),\n",
       "  ('source', 0.009120302996576247),\n",
       "  ('dial', 0.009052483076983206),\n",
       "  ('model', 0.009034301682248043),\n",
       "  ('analyze', 0.009025181933833502),\n",
       "  ('short', 0.009024267221565067),\n",
       "  ('set', 0.008972576981825998),\n",
       "  ('route', 0.008909423353462897)],\n",
       " 22: [('sterilize', 0.2578995046325108),\n",
       "  ('disinfection', 0.2098501825596082),\n",
       "  ('disinfect', 0.10064880422690692),\n",
       "  ('clean', 0.059063004239202826),\n",
       "  ('epidemic', 0.05562170759908014),\n",
       "  ('spray', 0.05293665923787994),\n",
       "  ('liquid', 0.04431534489119377),\n",
       "  ('livestock', 0.04272576386643799),\n",
       "  ('prevention', 0.04243661887625299),\n",
       "  ('sterilization', 0.04237844388501344),\n",
       "  ('disinfectant', 0.03951914506947553),\n",
       "  ('robot', 0.03376187344707258),\n",
       "  ('device', 0.03110990096768526),\n",
       "  ('control', 0.030776811767260732),\n",
       "  ('poultry', 0.027792607713927827),\n",
       "  ('house', 0.02647369332473564),\n",
       "  ('method', 0.026219952269665742),\n",
       "  ('sweep', 0.025031421875567204),\n",
       "  ('environment', 0.02249626400545454),\n",
       "  ('preset', 0.022011342666447074),\n",
       "  ('accord', 0.021939255004389403),\n",
       "  ('space', 0.021393126211855424),\n",
       "  ('detect', 0.02094063508139468),\n",
       "  ('time', 0.019697033410574397),\n",
       "  ('supplement', 0.01946831500057762),\n",
       "  ('wash', 0.01941583624220219),\n",
       "  ('mobile', 0.01932344561681233),\n",
       "  ('interior', 0.019177232139494783),\n",
       "  ('involve', 0.017908931826908323),\n",
       "  ('navigate', 0.017781519817780728),\n",
       "  ('public', 0.017634154162906722),\n",
       "  ('storage', 0.01762578052958983),\n",
       "  ('limit', 0.017515863286651934),\n",
       "  ('sensor', 0.017498069182995894),\n",
       "  ('wall', 0.017449760670286845),\n",
       "  ('surround', 0.017378654544415995),\n",
       "  ('floor', 0.017335478107734916),\n",
       "  ('bacteria', 0.016840491046104626),\n",
       "  ('cleaning', 0.016759801878193585),\n",
       "  ('lethal', 0.016741089766794365),\n",
       "  ('automatic', 0.016717351968961656),\n",
       "  ('target', 0.015958517686904004),\n",
       "  ('distance', 0.015414457327659779),\n",
       "  ('upper', 0.015382264761647394),\n",
       "  ('concentration', 0.015290381204620306),\n",
       "  ('microcontroller', 0.015229610386157246),\n",
       "  ('air', 0.015229025068186656),\n",
       "  ('book', 0.01503401876704373),\n",
       "  ('draw', 0.01434874112587853),\n",
       "  ('irradiation', 0.014182381750699292),\n",
       "  ('trigger', 0.013981819609095012),\n",
       "  ('contaminate', 0.013681008838556975),\n",
       "  ('advantage', 0.013575256471704744),\n",
       "  ('lamp', 0.013352743814498524),\n",
       "  ('endurance', 0.013351801208261871),\n",
       "  ('route', 0.01283866577165277),\n",
       "  ('excrement', 0.012733419826024764),\n",
       "  ('dose', 0.012584959284115361),\n",
       "  ('smart', 0.012567044077473766),\n",
       "  ('claim', 0.012529539626642876),\n",
       "  ('wheel', 0.012326430613546834),\n",
       "  ('comprise', 0.012267269926078251),\n",
       "  ('bio', 0.012159736944454009),\n",
       "  ('autonomous', 0.012158258663791853),\n",
       "  ('operation', 0.012139405153186691),\n",
       "  ('animal', 0.01205374142157853),\n",
       "  ('base', 0.011951015290009264),\n",
       "  ('light', 0.01192960764467622),\n",
       "  ('adjust', 0.011862501626560185),\n",
       "  ('strategy', 0.011856797620576657),\n",
       "  ('independent', 0.011825922707248096),\n",
       "  ('user', 0.011717204793794383),\n",
       "  ('path', 0.0115236907029822),\n",
       "  ('medium', 0.011520513909173302),\n",
       "  ('reduce', 0.011438083169127762),\n",
       "  ('injection', 0.011221159874497328),\n",
       "  ('nonenglish', 0.011165240089012533),\n",
       "  ('step', 0.011146310523213026),\n",
       "  ('mileage', 0.011049582066315504),\n",
       "  ('virus', 0.010908925103616268),\n",
       "  ('indoor', 0.010877884639251567),\n",
       "  ('text', 0.010864567407422749),\n",
       "  ('obstacle', 0.010829158046008465),\n",
       "  ('electronic', 0.010802849109913385),\n",
       "  ('improve', 0.010766114473752461),\n",
       "  ('language', 0.010754202854183225),\n",
       "  ('sterilizing', 0.010744307296835807),\n",
       "  ('amr', 0.010711676378269204),\n",
       "  ('remain', 0.010637819468171173),\n",
       "  ('ultravioletc', 0.01045392291775707),\n",
       "  ('system', 0.010386648454488133),\n",
       "  ('interface', 0.010338141467650445),\n",
       "  ('module', 0.010301473983027543),\n",
       "  ('selfreliant', 0.010228685094271609),\n",
       "  ('store', 0.010118321656494358),\n",
       "  ('andor', 0.010099433142941336),\n",
       "  ('contamination', 0.01001229934317748),\n",
       "  ('instruction', 0.009848579055692199),\n",
       "  ('operate', 0.009797140032832096),\n",
       "  ('ensure', 0.009776684595947256)],\n",
       " 23: [('paint', 0.20165565435019164),\n",
       "  ('painting', 0.16522549956569996),\n",
       "  ('artwork', 0.13690878301022302),\n",
       "  ('artistic', 0.097791987864445),\n",
       "  ('artist', 0.08355955264104978),\n",
       "  ('style', 0.06330657303202139),\n",
       "  ('render', 0.06323888156946172),\n",
       "  ('robotic', 0.05916024164925075),\n",
       "  ('canvas', 0.05891360026197178),\n",
       "  ('art', 0.05794869259602339),\n",
       "  ('rendering', 0.057078695876471984),\n",
       "  ('color', 0.05428317483225535),\n",
       "  ('technique', 0.0510021145713739),\n",
       "  ('watercolour', 0.05035707058689809),\n",
       "  ('stroke', 0.049389273733394336),\n",
       "  ('image', 0.04827648185207239),\n",
       "  ('create', 0.04628505260744557),\n",
       "  ('nonphotorealistic', 0.04531412698543591),\n",
       "  ('human', 0.043363151863301974),\n",
       "  ('brushstrokes', 0.03499731684894222),\n",
       "  ('rendition', 0.03445519703966097),\n",
       "  ('interactive', 0.03435627787775887),\n",
       "  ('algorithm', 0.03149788418901122),\n",
       "  ('paper', 0.031442372822024486),\n",
       "  ('palette', 0.029978681329380277),\n",
       "  ('brushstroke', 0.029698761332722957),\n",
       "  ('tone', 0.02823928234791045),\n",
       "  ('avatar', 0.028071830441594482),\n",
       "  ('texture', 0.02573601558993905),\n",
       "  ('collaborative', 0.024987968198349742),\n",
       "  ('child', 0.024884749418755438),\n",
       "  ('robocodraw', 0.024282187504161005),\n",
       "  ('busker', 0.024282187504161005),\n",
       "  ('reproduce', 0.023475876580148963),\n",
       "  ('system', 0.023264283441688877),\n",
       "  ('cybernetic', 0.022970131359773976),\n",
       "  ('produce', 0.022671707288470462),\n",
       "  ('region', 0.020217065972287323),\n",
       "  ('visual', 0.019747548468753713),\n",
       "  ('aesthetic', 0.01972012554370285),\n",
       "  ('acrylic', 0.019558397572889),\n",
       "  ('machine', 0.01954149340949126),\n",
       "  ('algorithmic', 0.019131026218833454),\n",
       "  ('experimental', 0.018775971008174276),\n",
       "  ('knife', 0.018395185393743317),\n",
       "  ('generative', 0.018137677348525463),\n",
       "  ('input', 0.01785639092554863),\n",
       "  ('learn', 0.017615236652966725),\n",
       "  ('draw', 0.017497726282695015),\n",
       "  ('reproduction', 0.01734917212761797),\n",
       "  ('stage', 0.01700770067085153),\n",
       "  ('result', 0.01650219684810714),\n",
       "  ('creativity', 0.016279843364955995),\n",
       "  ('international', 0.01596540619480485),\n",
       "  ('generate', 0.015897609367389706),\n",
       "  ('propose', 0.015770758479179074),\n",
       "  ('robot', 0.015729890546007885),\n",
       "  ('realistic', 0.015480211337284305),\n",
       "  ('team', 0.0149881195509192),\n",
       "  ('gan', 0.014728400065492945),\n",
       "  ('picture', 0.0145030837414321),\n",
       "  ('brush', 0.014481479942470737),\n",
       "  ('exhibition', 0.014207556525705649),\n",
       "  ('process', 0.013993074207539879),\n",
       "  ('computer', 0.013962181721016138),\n",
       "  ('sequence', 0.013937421896722913),\n",
       "  ('density', 0.013927586790346514),\n",
       "  ('adversarial', 0.013735982116960197),\n",
       "  ('challenge', 0.013613269476317072),\n",
       "  ('multifingered', 0.013571586450066892),\n",
       "  ('setup', 0.013145162917265224),\n",
       "  ('transfer', 0.012646936686243835),\n",
       "  ('planning', 0.01263369932072841),\n",
       "  ('apply', 0.012404675605066567),\n",
       "  ('trajectory', 0.012398362335166627),\n",
       "  ('scatter', 0.012385127287975684),\n",
       "  ('desire', 0.012272782409076326),\n",
       "  ('corobotic', 0.012141093752080502),\n",
       "  ('colorful', 0.011879504533089183),\n",
       "  ('approach', 0.0118394575755262),\n",
       "  ('basic', 0.011788428723056896),\n",
       "  ('capable', 0.011610248814890173),\n",
       "  ('path', 0.01147158223723433),\n",
       "  ('appearance', 0.011335087582939447),\n",
       "  ('monochromatic', 0.011328531746358977),\n",
       "  ('painter', 0.011190460130421798),\n",
       "  ('pictorial', 0.011190460130421798),\n",
       "  ('feedback', 0.011144258710089451),\n",
       "  ('original', 0.010960120878898048),\n",
       "  ('regionbased', 0.010955225896977852),\n",
       "  ('heterogeneous', 0.01090863417387165),\n",
       "  ('timeefficient', 0.010759401523494467),\n",
       "  ('robotized', 0.010750794970923176),\n",
       "  ('mix', 0.0107445173194017),\n",
       "  ('study', 0.010596103134841755),\n",
       "  ('finally', 0.01053863994365772),\n",
       "  ('bv', 0.01046694973959442),\n",
       "  ('fair', 0.010314569236302132),\n",
       "  ('interactively', 0.010197256732802053),\n",
       "  ('sculpture', 0.01014272910185961)],\n",
       " 24: [('steel', 0.12909894265981073),\n",
       "  ('iron', 0.12559095260588504),\n",
       "  ('alloy', 0.1119462053969168),\n",
       "  ('core', 0.08189408815272156),\n",
       "  ('temperature', 0.07186591214842528),\n",
       "  ('titanium', 0.06783568024213911),\n",
       "  ('ingot', 0.06646545856958032),\n",
       "  ('nickel', 0.06437741595778779),\n",
       "  ('furnace', 0.06354588374805337),\n",
       "  ('grain', 0.05944429123054335),\n",
       "  ('cast', 0.05665998639745052),\n",
       "  ('melt', 0.05381881039684172),\n",
       "  ('hafnium', 0.05218183307530909),\n",
       "  ('carbon', 0.05054503794710519),\n",
       "  ('material', 0.047742771535869914),\n",
       "  ('silicon', 0.04494398418993485),\n",
       "  ('molybdenum', 0.04345614558521424),\n",
       "  ('smelt', 0.043326787756357225),\n",
       "  ('slab', 0.042942959382484804),\n",
       "  ('degree', 0.04284969020405324),\n",
       "  ('chromium', 0.040091072076655646),\n",
       "  ('forge', 0.037297938513370356),\n",
       "  ('manganese', 0.03703654529738596),\n",
       "  ('hammer', 0.03651987814035763),\n",
       "  ('heat', 0.0360673015340539),\n",
       "  ('agent', 0.03407456086487221),\n",
       "  ('magnesium', 0.0334139793334047),\n",
       "  ('molten', 0.032890026784067446),\n",
       "  ('add', 0.03242839027259117),\n",
       "  ('vanadium', 0.032241992643010614),\n",
       "  ('rare', 0.03157500040034067),\n",
       "  ('powder', 0.031434941792231615),\n",
       "  ('minute', 0.031323806955113935),\n",
       "  ('crystal', 0.031248724088799654),\n",
       "  ('spheroidizing', 0.030999060491961158),\n",
       "  ('cool', 0.02969243090606474),\n",
       "  ('earth', 0.028599289800933115),\n",
       "  ('comprise', 0.028402897889762805),\n",
       "  ('sand', 0.028025844196893124),\n",
       "  ('reactor', 0.025621297559150963),\n",
       "  ('stainless', 0.025358224601019237),\n",
       "  ('wearresistant', 0.02460609976577946),\n",
       "  ('equal', 0.024324541619630595),\n",
       "  ('hour', 0.024294546058052726),\n",
       "  ('strength', 0.024263282427429065),\n",
       "  ('stir', 0.023967745362397885),\n",
       "  ('diesel', 0.023134935320230435),\n",
       "  ('slag', 0.021605220944027996),\n",
       "  ('dip', 0.02154004696734551),\n",
       "  ('sulfur', 0.021494661762007077),\n",
       "  ('pour', 0.021294759674078963),\n",
       "  ('carbide', 0.02062721128021458),\n",
       "  ('minus', 0.02056438695131594),\n",
       "  ('plate', 0.020197870698062684),\n",
       "  ('layer', 0.019985234615234965),\n",
       "  ('phase', 0.019930607995106094),\n",
       "  ('treatment', 0.01922627405206192),\n",
       "  ('aluminum', 0.019088533105370675),\n",
       "  ('phosphorus', 0.019072012016919573),\n",
       "  ('surface', 0.0188202223096118),\n",
       "  ('highstrength', 0.018576639795102854),\n",
       "  ('remove', 0.01854458831412003),\n",
       "  ('mainphase', 0.018005254084528174),\n",
       "  ('anneal', 0.017914893449323014),\n",
       "  ('wire', 0.017536115572985834),\n",
       "  ('spheroidization', 0.017484748334700016),\n",
       "  ('flexible', 0.017124097363523806),\n",
       "  ('refining', 0.01690857845016063),\n",
       "  ('ultrahighstrength', 0.01690857845016063),\n",
       "  ('preparation', 0.016862164870521813),\n",
       "  ('cobalt', 0.016751153667439643),\n",
       "  ('resistance', 0.016490715760681507),\n",
       "  ('heating', 0.016254559820714998),\n",
       "  ('gas', 0.015986653426474755),\n",
       "  ('entropy', 0.01588647093701334),\n",
       "  ('zinc', 0.015647588165617784),\n",
       "  ('engine', 0.015493990782107525),\n",
       "  ('harmonic', 0.015479795608932244),\n",
       "  ('permanent', 0.015422033747809502),\n",
       "  ('yttriumceriumbased', 0.015279278297233223),\n",
       "  ('rl40', 0.015279278297233223),\n",
       "  ('deoxidizer', 0.015279278297233223),\n",
       "  ('yttriumceriumcontaining', 0.015279278297233223),\n",
       "  ('industrial', 0.015228279714487682),\n",
       "  ('calcium', 0.01515479524229853),\n",
       "  ('bag', 0.015081986851978096),\n",
       "  ('metal', 0.014855208290020547),\n",
       "  ('prepare', 0.014590102963274407),\n",
       "  ('inoculant', 0.014570623612250012),\n",
       "  ('coat', 0.01442443257817554),\n",
       "  ('magnet', 0.014323561331410982),\n",
       "  ('shot', 0.01422767469686557),\n",
       "  ('ductile', 0.014090482041800525),\n",
       "  ('oxygen', 0.013932479846327141),\n",
       "  ('size', 0.013819287364000496),\n",
       "  ('niobium', 0.013726884008343255),\n",
       "  ('low', 0.01371628044109536),\n",
       "  ('electric', 0.013633359774167969),\n",
       "  ('pig', 0.013560934541837308),\n",
       "  ('wheel', 0.0135027365506659)],\n",
       " 25: [('tire', 0.5246541787806963),\n",
       "  ('rim', 0.09199991720604522),\n",
       "  ('wheel', 0.052417130536825264),\n",
       "  ('test', 0.04352646130559734),\n",
       "  ('sealant', 0.04027978350225457),\n",
       "  ('assembly', 0.03887796167549357),\n",
       "  ('drum', 0.038839883775749276),\n",
       "  ('anthropomorphic', 0.03419027680232193),\n",
       "  ('move', 0.03271883842755974),\n",
       "  ('robotized', 0.03257700927245993),\n",
       "  ('composition', 0.032220851985894645),\n",
       "  ('rail', 0.031226395309231107),\n",
       "  ('method', 0.028547380537297263),\n",
       "  ('green', 0.027984156699324837),\n",
       "  ('vehicle', 0.026725586573042682),\n",
       "  ('tirewheel', 0.0265121769734882),\n",
       "  ('form', 0.02624338133821611),\n",
       "  ('arm', 0.025782410641891847),\n",
       "  ('grip', 0.025483936189600792),\n",
       "  ('roller', 0.02481026826278847),\n",
       "  ('involve', 0.022872290747824816),\n",
       "  ('sort', 0.022083973374826274),\n",
       "  ('linear', 0.021990918484570365),\n",
       "  ('provide', 0.02195070648925602),\n",
       "  ('coordinate', 0.021701150153659365),\n",
       "  ('local', 0.021146818187028387),\n",
       "  ('mount', 0.021082364390085127),\n",
       "  ('image', 0.020898167480242452),\n",
       "  ('select', 0.020392936349093796),\n",
       "  ('balance', 0.02019986365311989),\n",
       "  ('machine', 0.020186776051545344),\n",
       "  ('mold', 0.01953243827507374),\n",
       "  ('bead', 0.01947241973793001),\n",
       "  ('surface', 0.019278046854173368),\n",
       "  ('mark', 0.018587707112456334),\n",
       "  ('light', 0.017492990882167814),\n",
       "  ('instal', 0.017484567948950286),\n",
       "  ('coat', 0.01737779613527655),\n",
       "  ('displaces', 0.01716383229066467),\n",
       "  ('nozzle', 0.017067932624383896),\n",
       "  ('heavyduty', 0.01698212196491654),\n",
       "  ('crush', 0.016909355679552467),\n",
       "  ('lubrication', 0.015932777931459394),\n",
       "  ('road', 0.01583184790536425),\n",
       "  ('cone', 0.015637231463355918),\n",
       "  ('heavy', 0.015581750875934768),\n",
       "  ('clamp', 0.014933766461753524),\n",
       "  ('assemble', 0.014910550788538297),\n",
       "  ('structure', 0.014755826948537687),\n",
       "  ('character', 0.01467071570317038),\n",
       "  ('cutter', 0.014466725407394732),\n",
       "  ('set', 0.014377571826673003),\n",
       "  ('draw', 0.014202195368376217),\n",
       "  ('yaxis', 0.014090159329942233),\n",
       "  ('manipulator', 0.014032246124208194),\n",
       "  ('zaxis', 0.013982505241442877),\n",
       "  ('position', 0.013970535599068556),\n",
       "  ('sleeve', 0.013963482422891978),\n",
       "  ('undergoing', 0.01379620733196004),\n",
       "  ('stack', 0.013756185777351103),\n",
       "  ('rotate', 0.013736544742565976),\n",
       "  ('waste', 0.013663815687365811),\n",
       "  ('construction', 0.013574334697410038),\n",
       "  ('unload', 0.013566749641887576),\n",
       "  ('attitude', 0.013523519823859239),\n",
       "  ('actuator', 0.013507712511127961),\n",
       "  ('lateral', 0.013495744078235984),\n",
       "  ('claim', 0.013435038105433342),\n",
       "  ('robot', 0.013211395251042186),\n",
       "  ('movement', 0.013197882239085548),\n",
       "  ('direction', 0.012942873058566895),\n",
       "  ('arrange', 0.01293670686686003),\n",
       "  ('piece', 0.012887923839777868),\n",
       "  ('suspension', 0.012575521418908319),\n",
       "  ('strip', 0.012570157945929052),\n",
       "  ('displace', 0.012542348681926437),\n",
       "  ('advantage', 0.012540836395974489),\n",
       "  ('rotation', 0.012458831632719804),\n",
       "  ('cantilever', 0.012430900518683804),\n",
       "  ('diameter', 0.012395801139380375),\n",
       "  ('passenger', 0.012282939227956946),\n",
       "  ('independent', 0.012262530612324117),\n",
       "  ('blank', 0.012182908882071419),\n",
       "  ('data', 0.01213381176936715),\n",
       "  ('ratchet', 0.012127446013765426),\n",
       "  ('threedimensional', 0.011947965184985686),\n",
       "  ('grasp', 0.011767846646535421),\n",
       "  ('command', 0.011745054447475747),\n",
       "  ('platform', 0.011691391346231933),\n",
       "  ('station', 0.011523400816348244),\n",
       "  ('free', 0.01150128887940143),\n",
       "  ('center', 0.011414344049291302),\n",
       "  ('mechanical', 0.01137667647981096),\n",
       "  ('process', 0.011307133024541402),\n",
       "  ('zone', 0.011157579710602468),\n",
       "  ('unstacking', 0.011112331125449145),\n",
       "  ('pattern', 0.011105788145611454),\n",
       "  ('apparatus', 0.011058483771494194),\n",
       "  ('car', 0.011041417825250454),\n",
       "  ('view', 0.010863057471581833)],\n",
       " 26: [('chess', 0.4039420178336737),\n",
       "  ('chessboard', 0.18415696891473263),\n",
       "  ('chessman', 0.13870041658574508),\n",
       "  ('game', 0.10513232442319692),\n",
       "  ('image', 0.10494352451533576),\n",
       "  ('play', 0.09067557954272386),\n",
       "  ('process', 0.04380217357442759),\n",
       "  ('portion', 0.03950351734582781),\n",
       "  ('move', 0.036303124363354936),\n",
       "  ('decision', 0.03424055827594793),\n",
       "  ('board', 0.03418376075202668),\n",
       "  ('attribute', 0.033058093656699476),\n",
       "  ('difficulty', 0.030544233610791876),\n",
       "  ('method', 0.03028457942706576),\n",
       "  ('piece', 0.02958573342220159),\n",
       "  ('perform', 0.02876262137789906),\n",
       "  ('accord', 0.02787297544801516),\n",
       "  ('tobemoved', 0.027839967811416656),\n",
       "  ('level', 0.02756336382873841),\n",
       "  ('subchessman', 0.025823693595119965),\n",
       "  ('gambit', 0.025823693595119965),\n",
       "  ('processing', 0.02441889203224546),\n",
       "  ('camera', 0.024323722983632536),\n",
       "  ('computer', 0.024280817549493922),\n",
       "  ('marker', 0.0228960586417983),\n",
       "  ('data', 0.022631847181447035),\n",
       "  ('determine', 0.022353673204461032),\n",
       "  ('recognition', 0.022017461736897517),\n",
       "  ('device', 0.021420309905467658),\n",
       "  ('scene', 0.021242991209597377),\n",
       "  ('involve', 0.021002405204526602),\n",
       "  ('card', 0.020807513934122553),\n",
       "  ('neural', 0.020531733338217586),\n",
       "  ('position', 0.01985347314199947),\n",
       "  ('locate', 0.019263134241842842),\n",
       "  ('claim', 0.01897950650885965),\n",
       "  ('base', 0.018926040245664747),\n",
       "  ('humanmachine', 0.01876241940168603),\n",
       "  ('robot', 0.018732185171562245),\n",
       "  ('projectbased', 0.018419336492822284),\n",
       "  ('electronic', 0.018409442405196434),\n",
       "  ('plane', 0.018341891478612964),\n",
       "  ('humancomputer', 0.01802445904046314),\n",
       "  ('control', 0.017789258091881727),\n",
       "  ('identify', 0.01741627674902387),\n",
       "  ('filter', 0.016597191882868362),\n",
       "  ('network', 0.016471767656720045),\n",
       "  ('vision', 0.016438444280535508),\n",
       "  ('sample', 0.01565857427655682),\n",
       "  ('element', 0.01550010340403137),\n",
       "  ('video', 0.015282397316852856),\n",
       "  ('angle', 0.015281330585484216),\n",
       "  ('preacquired', 0.014775592629425396),\n",
       "  ('collect', 0.014686051727932829),\n",
       "  ('enable', 0.014372107493027444),\n",
       "  ('nonenglish', 0.014310908374107966),\n",
       "  ('step', 0.014286645637296334),\n",
       "  ('draw', 0.014127878749730961),\n",
       "  ('text', 0.013925524883692643),\n",
       "  ('battle', 0.013814502369616712),\n",
       "  ('language', 0.013784066482747511),\n",
       "  ('grasp', 0.013507232746176231),\n",
       "  ('advantage', 0.013366299924586761),\n",
       "  ('accurately', 0.013214499720206633),\n",
       "  ('illustrate', 0.012982586658319365),\n",
       "  ('coordinate', 0.0129525560020088),\n",
       "  ('playing', 0.012915891808100936),\n",
       "  ('frame', 0.012864198080497529),\n",
       "  ('independent', 0.012795486488255913),\n",
       "  ('set', 0.012694382401657494),\n",
       "  ('sharpen', 0.012353767295032536),\n",
       "  ('judgment', 0.012254462686467724),\n",
       "  ('visual', 0.012019634241277107),\n",
       "  ('detection', 0.011785011954775892),\n",
       "  ('arm', 0.01162592610348305),\n",
       "  ('mechanical', 0.011607328319190978),\n",
       "  ('initial', 0.011522892104861758),\n",
       "  ('system', 0.011238211448499612),\n",
       "  ('generate', 0.01105864284638811),\n",
       "  ('diagram', 0.010426822884067731),\n",
       "  ('segmentation', 0.0104128500062285),\n",
       "  ('skeleton', 0.01041169073713191),\n",
       "  ('learning', 0.01024054787190745),\n",
       "  ('interactive', 0.009957833853118695),\n",
       "  ('highpass', 0.009730338930937608),\n",
       "  ('represent', 0.009548890915798013),\n",
       "  ('upload', 0.009461534928734203),\n",
       "  ('color', 0.009440070974905977),\n",
       "  ('machine', 0.009268220115816538),\n",
       "  ('identification', 0.009174643702344495),\n",
       "  ('realize', 0.009152132237655491),\n",
       "  ('result', 0.009131185004174565),\n",
       "  ('stream', 0.008821699039269406),\n",
       "  ('target', 0.00879042064043716),\n",
       "  ('medium', 0.00872552684456245),\n",
       "  ('annotation', 0.008573530626288755),\n",
       "  ('edge', 0.008441200431676961),\n",
       "  ('output', 0.008401342472558379),\n",
       "  ('detect', 0.00827490592499734),\n",
       "  ('movement', 0.00826289430147919)],\n",
       " 27: [('carton', 0.7065022099382622),\n",
       "  ('unloader', 0.3236252322127214),\n",
       "  ('unload', 0.2111665175230914),\n",
       "  ('pile', 0.16963478057076847),\n",
       "  ('conveyor', 0.12880143683599124),\n",
       "  ('robotic', 0.10406834409353577),\n",
       "  ('truck', 0.07284593893594564),\n",
       "  ('attach', 0.06284422477604379),\n",
       "  ('trailer', 0.05574817762870381),\n",
       "  ('dislodge', 0.055422535801988776),\n",
       "  ('arm', 0.05007220628449307),\n",
       "  ('lorry', 0.04303417182659149),\n",
       "  ('mobile', 0.042479305453785574),\n",
       "  ('front', 0.03876648858103226),\n",
       "  ('configure', 0.03547263013575754),\n",
       "  ('movable', 0.0334750811202927),\n",
       "  ('portion', 0.03328814647065748),\n",
       "  ('article', 0.033209968044495594),\n",
       "  ('load', 0.03233454178606173),\n",
       "  ('positioner', 0.032017928318441684),\n",
       "  ('movably', 0.031849830918208685),\n",
       "  ('system', 0.03125107681222144),\n",
       "  ('straddle', 0.029732629678081192),\n",
       "  ('floor', 0.02950381728629244),\n",
       "  ('conformable', 0.029432465165738924),\n",
       "  ('shelf', 0.02832642380835489),\n",
       "  ('location', 0.028322339503552896),\n",
       "  ('move', 0.027075053489346548),\n",
       "  ('vacuum', 0.026963098447985476),\n",
       "  ('manipulator', 0.025435318293945325),\n",
       "  ('laborer', 0.024777191398400993),\n",
       "  ('semitrailer', 0.024527054304782435),\n",
       "  ('contact', 0.024319106910865536),\n",
       "  ('conform', 0.023887373188656514),\n",
       "  ('raise', 0.0236310507373271),\n",
       "  ('distribution', 0.023506574249613874),\n",
       "  ('stack', 0.023231293866212734),\n",
       "  ('center', 0.023131701056471554),\n",
       "  ('warehouse', 0.022562292733725776),\n",
       "  ('body', 0.02199808022815012),\n",
       "  ('irregularity', 0.021983071313850362),\n",
       "  ('unloading', 0.021291869685544355),\n",
       "  ('descrambling', 0.021277096833018528),\n",
       "  ('frame', 0.020820031719032447),\n",
       "  ('minimize', 0.020533356301165075),\n",
       "  ('convey', 0.020212949209870885),\n",
       "  ('bulk', 0.01952529766924112),\n",
       "  ('remover', 0.01897046624615082),\n",
       "  ('catch', 0.018870061431352676),\n",
       "  ('item', 0.0184888111320154),\n",
       "  ('lift', 0.0184855172885612),\n",
       "  ('retract', 0.018346317243531675),\n",
       "  ('provide', 0.018164353653366508),\n",
       "  ('reconfigure', 0.017815696849040604),\n",
       "  ('view', 0.01765745798464732),\n",
       "  ('rest', 0.017603375724764225),\n",
       "  ('frontend', 0.017375291079086745),\n",
       "  ('rod', 0.017317565266110682),\n",
       "  ('access', 0.01718275851926793),\n",
       "  ('box', 0.01706743848878208),\n",
       "  ('bay', 0.016859568043931836),\n",
       "  ('configuration', 0.016573295616035853),\n",
       "  ('throughput', 0.01641889589191228),\n",
       "  ('unloaders', 0.016309217276416803),\n",
       "  ('cargo', 0.015720758374526075),\n",
       "  ('retrieval', 0.015272087944607457),\n",
       "  ('flexibility', 0.015265364169495421),\n",
       "  ('organization', 0.015232937060920958),\n",
       "  ('freezer', 0.015032224395668967),\n",
       "  ('reduce', 0.014870508827054991),\n",
       "  ('store', 0.014350585522835234),\n",
       "  ('counterbalance', 0.01433648736115472),\n",
       "  ('bumper', 0.01406912666599685),\n",
       "  ('require', 0.01373983988142677),\n",
       "  ('obstruction', 0.013452449844577425),\n",
       "  ('quantity', 0.013436353660059361),\n",
       "  ('draw', 0.013431325551531021),\n",
       "  ('visualization', 0.013196632057738),\n",
       "  ('orientation', 0.01307743241274511),\n",
       "  ('maximize', 0.01290569488394855),\n",
       "  ('maneuver', 0.012829498895467575),\n",
       "  ('isometric', 0.01280628606872168),\n",
       "  ('advantage', 0.012707295191781574),\n",
       "  ('rear', 0.012356147214612158),\n",
       "  ('effort', 0.012297328356616875),\n",
       "  ('loader', 0.012270527594542767),\n",
       "  ('aisle', 0.012211119029065494),\n",
       "  ('control', 0.012003764379566784),\n",
       "  ('fall', 0.011854771736520577),\n",
       "  ('vision', 0.011851212270282135),\n",
       "  ('subsequent', 0.011619879376751716),\n",
       "  ('dock', 0.01156609329518328),\n",
       "  ('pas', 0.01137127644742306),\n",
       "  ('cost', 0.01128062004078666),\n",
       "  ('facility', 0.011109492620761826),\n",
       "  ('product', 0.010670387670683885),\n",
       "  ('efficiently', 0.01059247380601043),\n",
       "  ('basic', 0.010556986562485599),\n",
       "  ('capture', 0.010530150545767666),\n",
       "  ('unloads', 0.010447143052370154)]}"
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 4查看每一个主题的关键词\n",
    "new_topic.get_topics()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "id": "44041d0f",
   "metadata": {},
   "outputs": [],
   "source": [
    "# 保存主题、关键词\n",
    "topic_keywords = new_topic.get_topics()\n",
    "import pickle\n",
    "# with open(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\4主题—主题词.pkl','wb') as f:\n",
    "#     pickle.dump(topic_keywords, f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "id": "2ace8cdf",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "29"
      ]
     },
     "execution_count": 45,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(topic_keywords)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "id": "f4990e2a",
   "metadata": {},
   "outputs": [],
   "source": [
    "DF1 = pd.DataFrame(topic_keywords)\n",
    "DF1.head()\n",
    "DF1.to_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\4主题-主题词概率.xlsx',index = False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "id": "0879277a",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>-1</th>\n",
       "      <th>0</th>\n",
       "      <th>1</th>\n",
       "      <th>2</th>\n",
       "      <th>3</th>\n",
       "      <th>4</th>\n",
       "      <th>5</th>\n",
       "      <th>6</th>\n",
       "      <th>7</th>\n",
       "      <th>8</th>\n",
       "      <th>...</th>\n",
       "      <th>18</th>\n",
       "      <th>19</th>\n",
       "      <th>20</th>\n",
       "      <th>21</th>\n",
       "      <th>22</th>\n",
       "      <th>23</th>\n",
       "      <th>24</th>\n",
       "      <th>25</th>\n",
       "      <th>26</th>\n",
       "      <th>27</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>robot</td>\n",
       "      <td>robot</td>\n",
       "      <td>wafer</td>\n",
       "      <td>fruit</td>\n",
       "      <td>mow</td>\n",
       "      <td>catheter</td>\n",
       "      <td>pipe</td>\n",
       "      <td>sample</td>\n",
       "      <td>print</td>\n",
       "      <td>fire</td>\n",
       "      <td>...</td>\n",
       "      <td>cloth</td>\n",
       "      <td>shoe</td>\n",
       "      <td>medicine</td>\n",
       "      <td>substation</td>\n",
       "      <td>sterilize</td>\n",
       "      <td>paint</td>\n",
       "      <td>steel</td>\n",
       "      <td>tire</td>\n",
       "      <td>chess</td>\n",
       "      <td>carton</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>method</td>\n",
       "      <td>weld</td>\n",
       "      <td>semiconductor</td>\n",
       "      <td>harvest</td>\n",
       "      <td>grass</td>\n",
       "      <td>ablation</td>\n",
       "      <td>pipeline</td>\n",
       "      <td>cell</td>\n",
       "      <td>printing</td>\n",
       "      <td>firefighting</td>\n",
       "      <td>...</td>\n",
       "      <td>garment</td>\n",
       "      <td>glue</td>\n",
       "      <td>pharmacy</td>\n",
       "      <td>inspection</td>\n",
       "      <td>disinfection</td>\n",
       "      <td>painting</td>\n",
       "      <td>iron</td>\n",
       "      <td>rim</td>\n",
       "      <td>chessboard</td>\n",
       "      <td>unloader</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>system</td>\n",
       "      <td>method</td>\n",
       "      <td>transfer</td>\n",
       "      <td>pick</td>\n",
       "      <td>mower</td>\n",
       "      <td>capsule</td>\n",
       "      <td>pipette</td>\n",
       "      <td>blood</td>\n",
       "      <td>additive</td>\n",
       "      <td>extinguish</td>\n",
       "      <td>...</td>\n",
       "      <td>textile</td>\n",
       "      <td>sole</td>\n",
       "      <td>medication</td>\n",
       "      <td>transformer</td>\n",
       "      <td>disinfect</td>\n",
       "      <td>artwork</td>\n",
       "      <td>alloy</td>\n",
       "      <td>wheel</td>\n",
       "      <td>chessman</td>\n",
       "      <td>unload</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>control</td>\n",
       "      <td>system</td>\n",
       "      <td>chamber</td>\n",
       "      <td>cut</td>\n",
       "      <td>lawn</td>\n",
       "      <td>brachytherapy</td>\n",
       "      <td>inspection</td>\n",
       "      <td>dna</td>\n",
       "      <td>manufacturing</td>\n",
       "      <td>flame</td>\n",
       "      <td>...</td>\n",
       "      <td>sew</td>\n",
       "      <td>spray</td>\n",
       "      <td>drug</td>\n",
       "      <td>meter</td>\n",
       "      <td>clean</td>\n",
       "      <td>artistic</td>\n",
       "      <td>core</td>\n",
       "      <td>test</td>\n",
       "      <td>game</td>\n",
       "      <td>pile</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>position</td>\n",
       "      <td>control</td>\n",
       "      <td>position</td>\n",
       "      <td>meat</td>\n",
       "      <td>cut</td>\n",
       "      <td>robotic</td>\n",
       "      <td>robot</td>\n",
       "      <td>protein</td>\n",
       "      <td>printer</td>\n",
       "      <td>water</td>\n",
       "      <td>...</td>\n",
       "      <td>clothes</td>\n",
       "      <td>footwear</td>\n",
       "      <td>storage</td>\n",
       "      <td>equipment</td>\n",
       "      <td>epidemic</td>\n",
       "      <td>artist</td>\n",
       "      <td>temperature</td>\n",
       "      <td>sealant</td>\n",
       "      <td>image</td>\n",
       "      <td>conveyor</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5 rows × 29 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        -1        0              1        2      3              4   \\\n",
       "0     robot    robot          wafer    fruit    mow       catheter   \n",
       "1    method     weld  semiconductor  harvest  grass       ablation   \n",
       "2    system   method       transfer     pick  mower        capsule   \n",
       "3   control   system        chamber      cut   lawn  brachytherapy   \n",
       "4  position  control       position     meat    cut        robotic   \n",
       "\n",
       "           5        6              7             8   ...       18        19  \\\n",
       "0        pipe   sample          print          fire  ...    cloth      shoe   \n",
       "1    pipeline     cell       printing  firefighting  ...  garment      glue   \n",
       "2     pipette    blood       additive    extinguish  ...  textile      sole   \n",
       "3  inspection      dna  manufacturing         flame  ...      sew     spray   \n",
       "4       robot  protein        printer         water  ...  clothes  footwear   \n",
       "\n",
       "           20           21            22        23           24       25  \\\n",
       "0    medicine   substation     sterilize     paint        steel     tire   \n",
       "1    pharmacy   inspection  disinfection  painting         iron      rim   \n",
       "2  medication  transformer     disinfect   artwork        alloy    wheel   \n",
       "3        drug        meter         clean  artistic         core     test   \n",
       "4     storage    equipment      epidemic    artist  temperature  sealant   \n",
       "\n",
       "           26        27  \n",
       "0       chess    carton  \n",
       "1  chessboard  unloader  \n",
       "2    chessman    unload  \n",
       "3        game      pile  \n",
       "4       image  conveyor  \n",
       "\n",
       "[5 rows x 29 columns]"
      ]
     },
     "execution_count": 47,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dic = {}\n",
    "for k,v in topic_keywords.items():\n",
    "    ls = []\n",
    "    for i in v:\n",
    "        ls.append(i[0])\n",
    "    dic[k] = ls\n",
    "    \n",
    "DF3 = pd.DataFrame(dic)\n",
    "DF3.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "id": "d0c09199",
   "metadata": {},
   "outputs": [],
   "source": [
    "DF3.to_excel(r'D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\4主题-主题词.xlsx',index = False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "376f03d6",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "id": "ed11d592",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'calculate_probabilities': True,\n",
       " 'ctfidf_model': ClassTfidfTransformer(),\n",
       " 'embedding_model': <bertopic.backend._sentencetransformers.SentenceTransformerBackend at 0x1a0d8021180>,\n",
       " 'hdbscan_model': HDBSCAN(min_cluster_size=10, prediction_data=True),\n",
       " 'language': 'english',\n",
       " 'low_memory': False,\n",
       " 'min_topic_size': 10,\n",
       " 'n_gram_range': (1, 1),\n",
       " 'nr_topics': 'auto',\n",
       " 'representation_model': None,\n",
       " 'seed_topic_list': None,\n",
       " 'top_n_words': 100,\n",
       " 'umap_model': UMAP(angular_rp_forest=True, low_memory=False, metric='cosine', min_dist=0.0, n_components=5, tqdm_kwds={'bar_format': '{desc}: {percentage:3.0f}%| {bar} {n_fmt}/{total_fmt} [{elapsed}]', 'desc': 'Epochs completed', 'disable': True}),\n",
       " 'vectorizer_model': CountVectorizer(),\n",
       " 'verbose': True}"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 5获取参数\n",
    "new_topic.get_params()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "id": "faf618d1",
   "metadata": {},
   "outputs": [],
   "source": [
    "# 6 保存模型\n",
    "new_topic.save(r\"D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\yingyong_yanjiu_model\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1ab3990e",
   "metadata": {},
   "outputs": [],
   "source": [
    "# 7 加载模型\n",
    "model = BERTopic.load(r\"D:\\jupyter\\DK\\DK数据\\2数据处理\\3聚类\\2应用研究\\yingyong_yanjiu_model\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "df4d0ca0",
   "metadata": {},
   "outputs": [],
   "source": [
    "# model.get_topics()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
